Mock Version: 6.1 Mock Version: 6.1 Mock Version: 6.1 ENTER ['do_with_status'](['bash', '--login', '-c', '/usr/bin/rpmbuild -bs --noclean --target x86_64 --nodeps /builddir/build/SPECS/rccl.spec'], chrootPath='/var/lib/mock/f42-build-58881909-6568954/root'env={'TERM': 'vt100', 'SHELL': '/bin/bash', 'HOME': '/builddir', 'HOSTNAME': 'mock', 'PATH': '/usr/bin:/bin:/usr/sbin:/sbin', 'PROMPT_COMMAND': 'printf "\\033]0;\\007"', 'PS1': ' \\s-\\v\\$ ', 'LANG': 'C.UTF-8'}shell=Falselogger=timeout=201600uid=1000gid=425user='mockbuild'unshare_net=TrueprintOutput=Falsenspawn_args=['--capability=cap_ipc_lock', '--bind=/tmp/mock-resolv.c75cjv4m:/etc/resolv.conf', '--bind=/dev/btrfs-control', '--bind=/dev/mapper/control', '--bind=/dev/fuse', '--bind=/dev/loop-control', '--bind=/dev/loop0', '--bind=/dev/loop1', '--bind=/dev/loop2', '--bind=/dev/loop3', '--bind=/dev/loop4', '--bind=/dev/loop5', '--bind=/dev/loop6', '--bind=/dev/loop7', '--bind=/dev/loop8', '--bind=/dev/loop9', '--bind=/dev/loop10', '--bind=/dev/loop11']) Using nspawn with args ['--capability=cap_ipc_lock', '--bind=/tmp/mock-resolv.c75cjv4m:/etc/resolv.conf', '--bind=/dev/btrfs-control', '--bind=/dev/mapper/control', '--bind=/dev/fuse', '--bind=/dev/loop-control', '--bind=/dev/loop0', '--bind=/dev/loop1', '--bind=/dev/loop2', '--bind=/dev/loop3', '--bind=/dev/loop4', '--bind=/dev/loop5', '--bind=/dev/loop6', '--bind=/dev/loop7', '--bind=/dev/loop8', '--bind=/dev/loop9', '--bind=/dev/loop10', '--bind=/dev/loop11'] Executing command: ['/usr/bin/systemd-nspawn', '-q', '-M', '1f6ca8b2ad93490abc58299bcdd9b180', '-D', '/var/lib/mock/f42-build-58881909-6568954/root', '-a', '-u', 'mockbuild', '--capability=cap_ipc_lock', '--bind=/tmp/mock-resolv.c75cjv4m:/etc/resolv.conf', '--bind=/dev/btrfs-control', '--bind=/dev/mapper/control', '--bind=/dev/fuse', '--bind=/dev/loop-control', '--bind=/dev/loop0', '--bind=/dev/loop1', '--bind=/dev/loop2', '--bind=/dev/loop3', '--bind=/dev/loop4', '--bind=/dev/loop5', '--bind=/dev/loop6', '--bind=/dev/loop7', '--bind=/dev/loop8', '--bind=/dev/loop9', '--bind=/dev/loop10', '--bind=/dev/loop11', '--console=pipe', '--setenv=TERM=vt100', '--setenv=SHELL=/bin/bash', '--setenv=HOME=/builddir', '--setenv=HOSTNAME=mock', '--setenv=PATH=/usr/bin:/bin:/usr/sbin:/sbin', '--setenv=PROMPT_COMMAND=printf "\\033]0;\\007"', '--setenv=PS1= \\s-\\v\\$ ', '--setenv=LANG=C.UTF-8', '--resolv-conf=off', 'bash', '--login', '-c', '/usr/bin/rpmbuild -bs --noclean --target x86_64 --nodeps /builddir/build/SPECS/rccl.spec'] with env {'TERM': 'vt100', 'SHELL': '/bin/bash', 'HOME': '/builddir', 'HOSTNAME': 'mock', 'PATH': '/usr/bin:/bin:/usr/sbin:/sbin', 'PROMPT_COMMAND': 'printf "\\033]0;\\007"', 'PS1': ' \\s-\\v\\$ ', 'LANG': 'C.UTF-8', 'SYSTEMD_NSPAWN_TMPFS_TMP': '0', 'SYSTEMD_SECCOMP': '0'} and shell False Building target platforms: x86_64 Building for target x86_64 setting SOURCE_DATE_EPOCH=1737158400 Wrote: /builddir/build/SRPMS/rccl-6.3.0-3.fc42.src.rpm Child return code was: 0 ENTER ['do_with_status'](['bash', '--login', '-c', '/usr/bin/rpmbuild -bb --noclean --target x86_64 --nodeps /builddir/build/SPECS/rccl.spec'], chrootPath='/var/lib/mock/f42-build-58881909-6568954/root'env={'TERM': 'vt100', 'SHELL': '/bin/bash', 'HOME': '/builddir', 'HOSTNAME': 'mock', 'PATH': '/usr/bin:/bin:/usr/sbin:/sbin', 'PROMPT_COMMAND': 'printf "\\033]0;\\007"', 'PS1': ' \\s-\\v\\$ ', 'LANG': 'C.UTF-8'}shell=Falselogger=timeout=201600uid=1000gid=425user='mockbuild'unshare_net=TrueprintOutput=Falsenspawn_args=['--capability=cap_ipc_lock', '--bind=/tmp/mock-resolv.c75cjv4m:/etc/resolv.conf', '--bind=/dev/btrfs-control', '--bind=/dev/mapper/control', '--bind=/dev/fuse', '--bind=/dev/loop-control', '--bind=/dev/loop0', '--bind=/dev/loop1', '--bind=/dev/loop2', '--bind=/dev/loop3', '--bind=/dev/loop4', '--bind=/dev/loop5', '--bind=/dev/loop6', '--bind=/dev/loop7', '--bind=/dev/loop8', '--bind=/dev/loop9', '--bind=/dev/loop10', '--bind=/dev/loop11']) Using nspawn with args ['--capability=cap_ipc_lock', '--bind=/tmp/mock-resolv.c75cjv4m:/etc/resolv.conf', '--bind=/dev/btrfs-control', '--bind=/dev/mapper/control', '--bind=/dev/fuse', '--bind=/dev/loop-control', '--bind=/dev/loop0', '--bind=/dev/loop1', '--bind=/dev/loop2', '--bind=/dev/loop3', '--bind=/dev/loop4', '--bind=/dev/loop5', '--bind=/dev/loop6', '--bind=/dev/loop7', '--bind=/dev/loop8', '--bind=/dev/loop9', '--bind=/dev/loop10', '--bind=/dev/loop11'] Executing command: ['/usr/bin/systemd-nspawn', '-q', '-M', '40222f2bae8e47c2993ff7c891377e88', '-D', '/var/lib/mock/f42-build-58881909-6568954/root', '-a', '-u', 'mockbuild', '--capability=cap_ipc_lock', '--bind=/tmp/mock-resolv.c75cjv4m:/etc/resolv.conf', '--bind=/dev/btrfs-control', '--bind=/dev/mapper/control', '--bind=/dev/fuse', '--bind=/dev/loop-control', '--bind=/dev/loop0', '--bind=/dev/loop1', '--bind=/dev/loop2', '--bind=/dev/loop3', '--bind=/dev/loop4', '--bind=/dev/loop5', '--bind=/dev/loop6', '--bind=/dev/loop7', '--bind=/dev/loop8', '--bind=/dev/loop9', '--bind=/dev/loop10', '--bind=/dev/loop11', '--console=pipe', '--setenv=TERM=vt100', '--setenv=SHELL=/bin/bash', '--setenv=HOME=/builddir', '--setenv=HOSTNAME=mock', '--setenv=PATH=/usr/bin:/bin:/usr/sbin:/sbin', '--setenv=PROMPT_COMMAND=printf "\\033]0;\\007"', '--setenv=PS1= \\s-\\v\\$ ', '--setenv=LANG=C.UTF-8', '--resolv-conf=off', 'bash', '--login', '-c', '/usr/bin/rpmbuild -bb --noclean --target x86_64 --nodeps /builddir/build/SPECS/rccl.spec'] with env {'TERM': 'vt100', 'SHELL': '/bin/bash', 'HOME': '/builddir', 'HOSTNAME': 'mock', 'PATH': '/usr/bin:/bin:/usr/sbin:/sbin', 'PROMPT_COMMAND': 'printf "\\033]0;\\007"', 'PS1': ' \\s-\\v\\$ ', 'LANG': 'C.UTF-8', 'SYSTEMD_NSPAWN_TMPFS_TMP': '0', 'SYSTEMD_SECCOMP': '0'} and shell False Building target platforms: x86_64 Building for target x86_64 setting SOURCE_DATE_EPOCH=1737158400 Executing(%mkbuilddir): /bin/sh -e /var/tmp/rpm-tmp.kke1Co Executing(%prep): /bin/sh -e /var/tmp/rpm-tmp.H7lcw9 + umask 022 + cd /builddir/build/BUILD/rccl-6.3.0-build + cd /builddir/build/BUILD/rccl-6.3.0-build + rm -rf rccl-rocm-6.3.0 + /usr/lib/rpm/rpmuncompress -x /builddir/build/SOURCES/RCCL-6.3.0.tar.gz + STATUS=0 + '[' 0 -ne 0 ']' + cd rccl-rocm-6.3.0 + /usr/bin/chmod -Rf a+rX,u+w,g-w,o-w . + sed -i -e '/AMD GPU targets to compile for/d' CMakeLists.txt + sed -i -e 's@cat ${ROCM_PATH}/.info/version@echo 6.3.0@' CMakeLists.txt + sed -i -e s@rocm-core/rocm_version.h@rocm_version.h@ src/include/hip_rocm_version_info.h + RPM_EC=0 ++ jobs -p + exit 0 Executing(%build): /bin/sh -e /var/tmp/rpm-tmp.GkrKWz + umask 022 + cd /builddir/build/BUILD/rccl-6.3.0-build + CFLAGS='-O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer ' + export CFLAGS + CXXFLAGS='-O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer' + export CXXFLAGS + FFLAGS='-O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -I/usr/lib64/gfortran/modules ' + export FFLAGS + FCFLAGS='-O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -I/usr/lib64/gfortran/modules ' + export FCFLAGS + VALAFLAGS=-g + export VALAFLAGS + RUSTFLAGS='-Copt-level=3 -Cdebuginfo=2 -Ccodegen-units=1 -Cstrip=none -Cforce-frame-pointers=yes -Clink-arg=-specs=/usr/lib/rpm/redhat/redhat-package-notes --cap-lints=warn' + export RUSTFLAGS + LDFLAGS='-Wl,-z,relro -Wl,--as-needed -Wl,-z,pack-relative-relocs -Wl,-z,now -Wl,-z,now -Wl,--build-id=sha1 -specs=/usr/lib/rpm/redhat/redhat-package-notes ' + export LDFLAGS + LT_SYS_LIBRARY_PATH=/usr/lib64: + export LT_SYS_LIBRARY_PATH + CC=hipcc + export CC + CXX=hipcc + export CXX + cd rccl-rocm-6.3.0 + CFLAGS='-O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer ' + export CFLAGS + CXXFLAGS='-O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer' + export CXXFLAGS + FFLAGS='-O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -I/usr/lib64/gfortran/modules ' + export FFLAGS + FCFLAGS='-O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -I/usr/lib64/gfortran/modules ' + export FCFLAGS + VALAFLAGS=-g + export VALAFLAGS + RUSTFLAGS='-Copt-level=3 -Cdebuginfo=2 -Ccodegen-units=1 -Cstrip=none -Cforce-frame-pointers=yes -Clink-arg=-specs=/usr/lib/rpm/redhat/redhat-package-notes --cap-lints=warn' + export RUSTFLAGS + LDFLAGS='-Wl,-z,relro -Wl,--as-needed -Wl,-z,pack-relative-relocs -Wl,-z,now -Wl,-z,now -Wl,--build-id=sha1 -specs=/usr/lib/rpm/redhat/redhat-package-notes ' + export LDFLAGS + LT_SYS_LIBRARY_PATH=/usr/lib64: + export LT_SYS_LIBRARY_PATH + CC=hipcc + export CC + CXX=hipcc + export CXX + /usr/bin/cmake -S . -B redhat-linux-build -DCMAKE_C_FLAGS_RELEASE:STRING=-DNDEBUG -DCMAKE_CXX_FLAGS_RELEASE:STRING=-DNDEBUG -DCMAKE_Fortran_FLAGS_RELEASE:STRING=-DNDEBUG -DCMAKE_VERBOSE_MAKEFILE:BOOL=ON -DCMAKE_INSTALL_DO_STRIP:BOOL=OFF -DCMAKE_INSTALL_PREFIX:PATH=/usr -DCMAKE_INSTALL_FULL_SBINDIR:PATH=/usr/bin -DCMAKE_INSTALL_SBINDIR:PATH=bin -DINCLUDE_INSTALL_DIR:PATH=/usr/include -DLIB_INSTALL_DIR:PATH=/usr/lib64 -DSYSCONF_INSTALL_DIR:PATH=/etc -DSHARE_INSTALL_PREFIX:PATH=/usr/share -DLIB_SUFFIX=64 -DBUILD_SHARED_LIBS:BOOL=ON -DBUILD_TESTS=OFF -DCMAKE_BUILD_TYPE=RelWithDebInfo -DCMAKE_CXX_COMPILER=/usr/bin/hipcc -DCMAKE_C_COMPILER=/usr/bin/hipcc -DCMAKE_EXPORT_COMPILE_COMMANDS=OFF -DCMAKE_SKIP_RPATH=ON -DBUILD_FILE_REORG_BACKWARD_COMPATIBILITY=OFF -DCMAKE_INSTALL_LIBDIR=/usr/lib64 -DROCM_SYMLINK_LIBS=OFF '-DAMDGPU_TARGETS=gfx90a:xnack+;gfx90a:xnack-;gfx1100;gfx1101;gfx1102;gfx1200;gfx1201' -DHIP_PLATFORM=amd -DRCCL_ROCPROFILER_REGISTER=OFF CMake Deprecation Warning at CMakeLists.txt:6 (cmake_minimum_required): Compatibility with CMake < 3.10 will be removed from a future version of CMake. Update the VERSION argument value. Or, use the ... syntax to tell CMake that the project requires at least but has been updated to work with policies introduced by or earlier. -- CMAKE_TOOLCHAIN_FILE: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/toolchain-linux.cmake -- The CXX compiler identification is Clang 18.0.0 -- Detecting CXX compiler ABI info -- Detecting CXX compiler ABI info - done -- Check for working CXX compiler: /usr/bin/hipcc - skipped -- Detecting CXX compile features -- Detecting CXX compile features - done -- Could NOT find GTest (missing: GTEST_LIBRARY GTEST_INCLUDE_DIR GTEST_MAIN_LIBRARY) (Required is at least version "1.11") -- Checking for ROCm support for GPU targets: gfx90a:xnack+;gfx90a:xnack-;gfx1100;gfx1101;gfx1102;gfx1200;gfx1201 -- Performing Test COMPILER_HAS_TARGET_ID_gfx90a_xnack_on -- Performing Test COMPILER_HAS_TARGET_ID_gfx90a_xnack_on - Success -- Performing Test COMPILER_HAS_TARGET_ID_gfx90a_xnack_off -- Performing Test COMPILER_HAS_TARGET_ID_gfx90a_xnack_off - Success -- Performing Test COMPILER_HAS_TARGET_ID_gfx1100 -- Performing Test COMPILER_HAS_TARGET_ID_gfx1100 - Success -- Performing Test COMPILER_HAS_TARGET_ID_gfx1101 -- Performing Test COMPILER_HAS_TARGET_ID_gfx1101 - Success -- Performing Test COMPILER_HAS_TARGET_ID_gfx1102 -- Performing Test COMPILER_HAS_TARGET_ID_gfx1102 - Success -- Performing Test COMPILER_HAS_TARGET_ID_gfx1200 -- Performing Test COMPILER_HAS_TARGET_ID_gfx1200 - Success -- Performing Test COMPILER_HAS_TARGET_ID_gfx1201 -- Performing Test COMPILER_HAS_TARGET_ID_gfx1201 - Success -- Compiling for gfx90a:xnack+;gfx90a:xnack-;gfx1100;gfx1101;gfx1102;gfx1200;gfx1201 -- Could NOT find GTest (missing: GTEST_LIBRARY GTEST_INCLUDE_DIR GTEST_MAIN_LIBRARY) (Required is at least version "1.11") -- ROCM_PATH found: /opt/rocm -- Compiling with hipcc -- Performing Test CMAKE_HAVE_LIBC_PTHREAD -- Performing Test CMAKE_HAVE_LIBC_PTHREAD - Success -- Found Threads: TRUE -- Performing Test HIP_CLANG_SUPPORTS_PARALLEL_JOBS -- Performing Test HIP_CLANG_SUPPORTS_PARALLEL_JOBS - Success -- HIP compiler: clang -- HIP runtime: rocclr -- hipcc executable: /usr/bin/hipcc sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory -- hipcc version: 6.3.42133 -- hipconfig executable: /usr/bin/hipconfig -- hipcc HIP version: 6.3.42133 -- ROCm version: 6.3.0 ******************************************************************************* *------------------------------- ROCMChecks WARNING --------------------------* Options and properties should be set on a cmake target where possible. The variable 'CMAKE_CXX_FLAGS' may be set by the cmake toolchain, either by calling 'cmake -DCMAKE_CXX_FLAGS="-O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer"' or set in a toolchain file and added with 'cmake -DCMAKE_TOOLCHAIN_FILE='. ROCMChecks now calling: CMake Warning at /usr/share/rocmcmakebuildtools/cmake/ROCMChecks.cmake:46 (message): 'CMAKE_CXX_FLAGS' is set at /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/CMakeLists.txt: shown below: Call Stack (most recent call first): /usr/share/cmake/Modules/CheckSymbolExists.cmake:9223372036854775807 (rocm_check_toolchain_var) /usr/share/cmake/Modules/CheckSymbolExists.cmake:87 (string) /usr/share/cmake/Modules/CheckSymbolExists.cmake:71 (__CHECK_SYMBOL_EXISTS_FILTER_FLAGS) CMakeLists.txt:191 (check_symbol_exists) *-----------------------------------------------------------------------------* ******************************************************************************* ******************************************************************************* *------------------------------- ROCMChecks WARNING --------------------------* Options and properties should be set on a cmake target where possible. The variable 'CMAKE_CXX_FLAGS' may be set by the cmake toolchain, either by calling 'cmake -DCMAKE_CXX_FLAGS="-O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer"' or set in a toolchain file and added with 'cmake -DCMAKE_TOOLCHAIN_FILE='. ROCMChecks now calling: CMake Warning at /usr/share/rocmcmakebuildtools/cmake/ROCMChecks.cmake:46 (message): 'CMAKE_CXX_FLAGS' is set at /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/CMakeLists.txt: shown below: Call Stack (most recent call first): /usr/share/cmake/Modules/CheckSymbolExists.cmake:9223372036854775807 (rocm_check_toolchain_var) /usr/share/cmake/Modules/CheckSymbolExists.cmake:88 (string) /usr/share/cmake/Modules/CheckSymbolExists.cmake:71 (__CHECK_SYMBOL_EXISTS_FILTER_FLAGS) CMakeLists.txt:191 (check_symbol_exists) *-----------------------------------------------------------------------------* ******************************************************************************* -- Looking for hipDeviceMallocUncached -- Looking for hipDeviceMallocUncached - found ******************************************************************************* *------------------------------- ROCMChecks WARNING --------------------------* Options and properties should be set on a cmake target where possible. The variable 'CMAKE_CXX_FLAGS' may be set by the cmake toolchain, either by calling 'cmake -DCMAKE_CXX_FLAGS="-O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer"' or set in a toolchain file and added with 'cmake -DCMAKE_TOOLCHAIN_FILE='. ROCMChecks now calling: CMake Warning at /usr/share/rocmcmakebuildtools/cmake/ROCMChecks.cmake:46 (message): 'CMAKE_CXX_FLAGS' is set at /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/CMakeLists.txt: shown below: Call Stack (most recent call first): /usr/share/cmake/Modules/CheckSymbolExists.cmake:9223372036854775807 (rocm_check_toolchain_var) /usr/share/cmake/Modules/CheckSymbolExists.cmake:99 (set) /usr/share/cmake/Modules/CheckSymbolExists.cmake:73 (__CHECK_SYMBOL_EXISTS_RESTORE_FLAGS) CMakeLists.txt:191 (check_symbol_exists) *-----------------------------------------------------------------------------* ******************************************************************************* -- Looking for hipDeviceMallocContiguous ******************************************************************************* *------------------------------- ROCMChecks WARNING --------------------------* Options and properties should be set on a cmake target where possible. The variable 'CMAKE_CXX_FLAGS' may be set by the cmake toolchain, either by calling 'cmake -DCMAKE_CXX_FLAGS="-O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer"' or set in a toolchain file and added with 'cmake -DCMAKE_TOOLCHAIN_FILE='. ROCMChecks now calling: CMake Warning at /usr/share/rocmcmakebuildtools/cmake/ROCMChecks.cmake:46 (message): 'CMAKE_CXX_FLAGS' is set at /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/CMakeLists.txt: shown below: Call Stack (most recent call first): /usr/share/cmake/Modules/CheckSymbolExists.cmake:9223372036854775807 (rocm_check_toolchain_var) /usr/share/cmake/Modules/CheckSymbolExists.cmake:87 (string) /usr/share/cmake/Modules/CheckSymbolExists.cmake:71 (__CHECK_SYMBOL_EXISTS_FILTER_FLAGS) CMakeLists.txt:194 (check_symbol_exists) *-----------------------------------------------------------------------------* ******************************************************************************* ******************************************************************************* *------------------------------- ROCMChecks WARNING --------------------------* Options and properties should be set on a cmake target where possible. The variable 'CMAKE_CXX_FLAGS' may be set by the cmake toolchain, either by calling 'cmake -DCMAKE_CXX_FLAGS="-O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer"' or set in a toolchain file and added with 'cmake -DCMAKE_TOOLCHAIN_FILE='. ROCMChecks now calling: CMake Warning at /usr/share/rocmcmakebuildtools/cmake/ROCMChecks.cmake:46 (message): 'CMAKE_CXX_FLAGS' is set at /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/CMakeLists.txt: shown below: Call Stack (most recent call first): /usr/share/cmake/Modules/CheckSymbolExists.cmake:9223372036854775807 (rocm_check_toolchain_var) /usr/share/cmake/Modules/CheckSymbolExists.cmake:88 (string) /usr/share/cmake/Modules/CheckSymbolExists.cmake:71 (__CHECK_SYMBOL_EXISTS_FILTER_FLAGS) CMakeLists.txt:194 (check_symbol_exists) *-----------------------------------------------------------------------------* ******************************************************************************* -- Looking for hipDeviceMallocContiguous - found ******************************************************************************* *------------------------------- ROCMChecks WARNING --------------------------* Options and properties should be set on a cmake target where possible. The variable 'CMAKE_CXX_FLAGS' may be set by the cmake toolchain, either by calling 'cmake -DCMAKE_CXX_FLAGS="-O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer"' or set in a toolchain file and added with 'cmake -DCMAKE_TOOLCHAIN_FILE='. ROCMChecks now calling: CMake Warning at /usr/share/rocmcmakebuildtools/cmake/ROCMChecks.cmake:46 (message): 'CMAKE_CXX_FLAGS' is set at /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/CMakeLists.txt: shown below: Call Stack (most recent call first): /usr/share/cmake/Modules/CheckSymbolExists.cmake:9223372036854775807 (rocm_check_toolchain_var) /usr/share/cmake/Modules/CheckSymbolExists.cmake:99 (set) /usr/share/cmake/Modules/CheckSymbolExists.cmake:73 (__CHECK_SYMBOL_EXISTS_RESTORE_FLAGS) CMakeLists.txt:194 (check_symbol_exists) *-----------------------------------------------------------------------------* ******************************************************************************* -- RCCL LL128 protocol enabled -- HSA runtime: /usr/include -- Found rocm_smi at /usr/include -- Looking for C++ include /usr/include/rocm_smi/rocm_smi64Config.h -- Looking for C++ include /usr/include/rocm_smi/rocm_smi64Config.h - found -- RSMI_INIT_FLAG_THRAD_ONLY_MUTEX supported -- Performing Test HAVE_KERNARG_PRELOAD -- Performing Test HAVE_KERNARG_PRELOAD - Success -- Kernarg preloading to SGPR enabled CMake Warning at CMakeLists.txt:301 (message): Can only build MSCCL++ for gfx942; disabling MSCCL++ build -- Found Python3: /usr/bin/python3.13 (found version "3.13.3") found components: Interpreter -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/device_table.h -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/device_table.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/host_table.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp -- HIP_CONTIGUOUS_MEMORY enabled -- HIP_UNCACHED_MEMORY enabled cat: /sys/fs/cgroup/memory/memory.limit_in_bytes: No such file or directory -- Use 1 jobs for linking -- Building shared RCCL library -- rocm-cmake: Set license file to /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/LICENSE.txt. -- Configuring done (39.8s) -- Generating done (0.1s) CMake Warning: Manually-specified variables were not used by the project: CMAKE_CXX_FLAGS_RELEASE CMAKE_C_FLAGS_RELEASE CMAKE_Fortran_FLAGS_RELEASE CMAKE_INSTALL_DO_STRIP LIB_SUFFIX SHARE_INSTALL_PREFIX SYSCONF_INSTALL_DIR -- Build files have been written to: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build + /usr/bin/cmake --build redhat-linux-build -j6 --verbose Change Dir: '/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build' Run Build Command(s): /usr/bin/cmake -E env VERBOSE=1 /usr/bin/gmake -f Makefile -j6 /usr/bin/cmake -S/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0 -B/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build --check-build-system CMakeFiles/Makefile.cmake 0 /usr/bin/cmake -E cmake_progress_start /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/CMakeFiles /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build//CMakeFiles/progress.marks /usr/bin/gmake -f CMakeFiles/Makefile2 all gmake[1]: Entering directory '/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build' /usr/bin/gmake -f CMakeFiles/git_version_check.dir/build.make CMakeFiles/git_version_check.dir/depend gmake[2]: Entering directory '/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build' cd /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0 /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0 /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/CMakeFiles/git_version_check.dir/DependInfo.cmake "--color=" gmake[2]: Leaving directory '/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build' /usr/bin/gmake -f CMakeFiles/git_version_check.dir/build.make CMakeFiles/git_version_check.dir/build gmake[2]: Entering directory '/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build' [ 0%] Updating git_version.cpp if necessary /usr/bin/cmake -P /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/git_version.cmake -- Updating git_version.cpp gmake[2]: Leaving directory '/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build' [ 0%] Built target git_version_check /usr/bin/gmake -f CMakeFiles/rccl.dir/build.make CMakeFiles/rccl.dir/depend gmake[2]: Entering directory '/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build' [ 1%] Hipifying src/transport/shm.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/shm.cc [ 0%] Hipifying src/channel.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc [ 2%] Hipifying src/device/all_gather.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h [ 2%] Hipifying src/debug.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/debug.cc [ 2%] Hipifying src/collectives.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc [ 1%] Hipifying src/bootstrap.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/bootstrap.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/transport/shm.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/shm.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/shm.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/channel.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/bootstrap.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/bootstrap.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/bootstrap.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/collectives.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/debug.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/debug.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/debug.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/device/all_gather.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h [ 3%] Hipifying src/device/all_reduce.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h [ 3%] Hipifying src/device/alltoall_pivot.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/device/all_reduce.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/device/alltoall_pivot.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h [ 3%] Hipifying src/device/broadcast.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/device/broadcast.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h [ 3%] Hipifying src/device/common.cu -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.cu.cpp mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/device/common.cu -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.cu.cpp && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.cu.cpp Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h [ 3%] Hipifying src/device/common.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/device/common.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h [ 4%] Hipifying src/device/common_kernel.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common_kernel.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/device/common_kernel.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common_kernel.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common_kernel.h Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h [ 4%] Hipifying src/device/msccl_kernel_impl.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/device/msccl_kernel_impl.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h [ 4%] Hipifying src/device/network/unpack/unpack.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack/unpack.h [ 5%] Hipifying src/device/network/unpack/unpack_defs.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack/unpack_defs.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/device/network/unpack/unpack.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack/unpack.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack/unpack.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/device/network/unpack/unpack_defs.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack/unpack_defs.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack/unpack_defs.h Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common_kernel.h [ 5%] Hipifying src/device/onerank.cu -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/onerank.cu.cpp mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/device/onerank.cu -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/onerank.cu.cpp && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/onerank.cu.cpp Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h [ 5%] Hipifying src/device/op128.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/op128.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/device/op128.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/op128.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/op128.h [ 5%] Hipifying src/device/primitives.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/device/primitives.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack/unpack_defs.h Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack/unpack.h [ 6%] Hipifying src/device/prims_ll.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/device/prims_ll.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h [ 6%] Hipifying src/device/prims_ll128.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/device/prims_ll128.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h [ 6%] Hipifying src/device/prims_simple.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/device/prims_simple.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h [ 6%] Hipifying src/device/reduce.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/device/reduce.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/op128.h [ 6%] Hipifying src/device/reduce_kernel.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_kernel.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/device/reduce_kernel.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_kernel.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_kernel.h [ 7%] Hipifying src/device/reduce_scatter.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/device/reduce_scatter.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h [ 7%] Hipifying src/device/sendrecv.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/device/sendrecv.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h [ 7%] Hipifying src/enqueue.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/enqueue.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc [ 7%] Hipifying src/graph/connect.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/graph/connect.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h [ 7%] Hipifying src/graph/paths.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_kernel.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/graph/paths.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc [ 8%] Hipifying src/graph/rings.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rings.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/graph/rings.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rings.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rings.cc [ 8%] Hipifying src/graph/rings.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rings.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/graph/rings.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rings.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rings.h Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h [ 8%] Hipifying src/graph/rome_models.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/graph/rome_models.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc [ 8%] Hipifying src/graph/rome_models.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/graph/rome_models.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.h [ 9%] Hipifying src/graph/search.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/search.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/graph/search.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/search.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/search.cc [ 9%] Hipifying src/graph/topo.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/graph/topo.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc [ 9%] Hipifying src/graph/topo.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/graph/topo.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h [ 9%] Hipifying src/graph/trees.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/trees.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/graph/trees.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/trees.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/trees.cc [ 10%] Hipifying src/graph/tuning.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/graph/tuning.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc [ 10%] Hipifying src/graph/xml.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/graph/xml.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.cc [ 10%] Hipifying src/graph/xml.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/graph/xml.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h [ 10%] Hipifying src/group.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/group.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/group.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/group.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/group.cc [ 10%] Hipifying src/include/BfdBacktrace.hpp -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/BfdBacktrace.hpp mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/BfdBacktrace.hpp -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/BfdBacktrace.hpp && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/BfdBacktrace.hpp [ 10%] Hipifying src/include/align.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/align.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/align.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/align.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/align.h [ 11%] Hipifying src/include/alloc.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/alloc.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h [ 11%] Hipifying src/include/alt_rsmi.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alt_rsmi.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/alt_rsmi.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alt_rsmi.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alt_rsmi.h [ 11%] Hipifying src/include/api_trace.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/api_trace.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/api_trace.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/api_trace.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/api_trace.h [ 11%] Hipifying src/include/archinfo.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/archinfo.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/archinfo.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/archinfo.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/archinfo.h [ 12%] Hipifying src/include/argcheck.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/argcheck.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h [ 12%] Hipifying src/include/bootstrap.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/bootstrap.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/bootstrap.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/bootstrap.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/bootstrap.h [ 12%] Hipifying src/include/channel.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/channel.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h [ 13%] Hipifying src/include/checks.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/checks.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/checks.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/checks.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/checks.h [ 13%] Hipifying src/include/coll_net.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/coll_net.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h [ 13%] Hipifying src/include/collectives.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/collectives.h [ 13%] Hipifying src/include/comm.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/collectives.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/collectives.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/collectives.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/comm.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h [ 14%] Hipifying src/include/core.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/core.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h [ 14%] Hipifying src/include/cpuset.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/cpuset.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/cpuset.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/cpuset.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/cpuset.h [ 14%] Hipifying src/include/debug.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/debug.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/debug.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/debug.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/debug.h [ 14%] Hipifying src/include/device.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/device.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h [ 15%] Hipifying src/include/enqueue.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/enqueue.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/enqueue.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/enqueue.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/enqueue.h [ 15%] Hipifying src/include/gdrwrap.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/gdrwrap.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h [ 15%] Hipifying src/include/graph.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/graph.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h [ 15%] Hipifying src/include/git_version.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/git_version.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/git_version.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/git_version.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/git_version.h [ 16%] Hipifying src/include/group.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/group.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/group.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/group.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/group.h [ 16%] Hipifying src/include/hip_rocm_version_info.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/hip_rocm_version_info.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/hip_rocm_version_info.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/hip_rocm_version_info.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/hip_rocm_version_info.h [ 16%] Hipifying src/include/ibvcore.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/ibvcore.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/ibvcore.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/ibvcore.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/ibvcore.h [ 16%] Hipifying src/include/ibvsymbols.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/ibvsymbols.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/ibvsymbols.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/ibvsymbols.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/ibvsymbols.h [ 17%] Hipifying src/include/ibvwrap.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/ibvwrap.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/ibvwrap.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/ibvwrap.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/ibvwrap.h [ 17%] Hipifying src/include/info.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/info.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h [ 17%] Hipifying src/include/ipcsocket.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/ipcsocket.h [ 17%] Hipifying src/include/msccl/msccl_kernel.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_kernel.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/ipcsocket.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/ipcsocket.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/ipcsocket.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/msccl/msccl_kernel.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_kernel.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_kernel.h [ 17%] Hipifying src/include/msccl/msccl_lifecycle.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_lifecycle.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/msccl/msccl_lifecycle.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_lifecycle.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_lifecycle.h [ 18%] Hipifying src/include/msccl/msccl_parser.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/msccl/msccl_parser.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h [ 18%] Hipifying src/include/msccl/msccl_scheduler.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_scheduler.h [ 18%] Hipifying src/include/msccl/msccl_setup.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_setup.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/msccl/msccl_setup.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_setup.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_setup.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/msccl/msccl_scheduler.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_scheduler.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_scheduler.h [ 18%] Hipifying src/include/msccl/msccl_status.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_status.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/msccl/msccl_status.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_status.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_status.h [ 19%] Hipifying src/include/msccl/msccl_struct.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_struct.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/msccl/msccl_struct.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_struct.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_struct.h [ 19%] Hipifying src/include/nccl_common.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nccl_common.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nccl_common.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nccl_common.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nccl_common.h [ 20%] Hipifying src/include/nccl_net.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nccl_net.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nccl_net.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nccl_net.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nccl_net.h [ 20%] Hipifying src/include/nccl_tuner.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nccl_tuner.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nccl_tuner.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nccl_tuner.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nccl_tuner.h [ 20%] Hipifying src/include/net.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/net.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/net.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/net.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/net.h [ 20%] Hipifying src/include/net_device.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/net_device.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/net_device.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/net_device.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/net_device.h [ 20%] Hipifying src/include/npkit/npkit.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/npkit/npkit.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/npkit && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/npkit/npkit.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/npkit/npkit.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/npkit/npkit.h [ 20%] Hipifying src/include/npkit/npkit_event.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/npkit/npkit_event.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/npkit && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/npkit/npkit_event.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/npkit/npkit_event.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/npkit/npkit_event.h [ 20%] Hipifying src/include/npkit/npkit_struct.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/npkit/npkit_struct.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/npkit && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/npkit/npkit_struct.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/npkit/npkit_struct.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/npkit/npkit_struct.h [ 21%] Hipifying src/include/nvmlwrap.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvmlwrap.h [ 21%] Hipifying src/include/nvtx.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvmlwrap.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvmlwrap.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvmlwrap.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx.h [ 21%] Hipifying src/include/nvtx3/nvToolsExt.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExt.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3 && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx3/nvToolsExt.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExt.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExt.h [ 22%] Hipifying src/include/nvtx3/nvToolsExtCuda.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtCuda.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3 && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx3/nvToolsExtCuda.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtCuda.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtCuda.h [ 22%] Hipifying src/include/nvtx3/nvToolsExtCudaRt.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtCudaRt.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3 && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx3/nvToolsExtCudaRt.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtCudaRt.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtCudaRt.h [ 22%] Hipifying src/include/nvtx3/nvToolsExtOpenCL.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtOpenCL.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3 && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx3/nvToolsExtOpenCL.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtOpenCL.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtOpenCL.h [ 23%] Hipifying src/include/nvtx3/nvToolsExtPayload.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtPayload.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3 && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx3/nvToolsExtPayload.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtPayload.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtPayload.h [ 23%] Hipifying src/include/nvtx3/nvToolsExtSync.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtSync.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3 && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx3/nvToolsExtSync.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtSync.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtSync.h [ 23%] Hipifying src/include/nvtx3/nvtx3.hpp -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3 && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx3/nvtx3.hpp -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp [ 23%] Hipifying src/include/nvtx3/nvtxDetail/nvtxImpl.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImpl.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx3/nvtxDetail/nvtxImpl.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImpl.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImpl.h [ 23%] Hipifying src/include/nvtx3/nvtxDetail/nvtxImplCore.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImplCore.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx3/nvtxDetail/nvtxImplCore.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImplCore.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImplCore.h [ 24%] Hipifying src/include/nvtx3/nvtxDetail/nvtxImplCudaRt_v3.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImplCudaRt_v3.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx3/nvtxDetail/nvtxImplCudaRt_v3.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImplCudaRt_v3.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImplCudaRt_v3.h [ 24%] Hipifying src/include/nvtx3/nvtxDetail/nvtxImplCuda_v3.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImplCuda_v3.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx3/nvtxDetail/nvtxImplCuda_v3.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImplCuda_v3.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImplCuda_v3.h [ 24%] Hipifying src/include/nvtx3/nvtxDetail/nvtxImplOpenCL_v3.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImplOpenCL_v3.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx3/nvtxDetail/nvtxImplOpenCL_v3.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImplOpenCL_v3.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImplOpenCL_v3.h [ 25%] Hipifying src/include/nvtx3/nvtxDetail/nvtxImplSync_v3.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImplSync_v3.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx3/nvtxDetail/nvtxImplSync_v3.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImplSync_v3.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImplSync_v3.h [ 25%] Hipifying src/include/nvtx3/nvtxDetail/nvtxInit.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxInit.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx3/nvtxDetail/nvtxInit.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxInit.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxInit.h [ 25%] Hipifying src/include/nvtx3/nvtxDetail/nvtxInitDecls.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxInitDecls.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx3/nvtxDetail/nvtxInitDecls.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxInitDecls.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxInitDecls.h [ 25%] Hipifying src/include/nvtx3/nvtxDetail/nvtxInitDefs.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxInitDefs.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx3/nvtxDetail/nvtxInitDefs.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxInitDefs.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxInitDefs.h [ 26%] Hipifying src/include/nvtx3/nvtxDetail/nvtxLinkOnce.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxLinkOnce.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx3/nvtxDetail/nvtxLinkOnce.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxLinkOnce.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxLinkOnce.h [ 26%] Hipifying src/include/nvtx3/nvtxDetail/nvtxTypes.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxTypes.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx3/nvtxDetail/nvtxTypes.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxTypes.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxTypes.h [ 26%] Hipifying src/include/nvtx3/nvtxExtDetail/nvtxExtImpl.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxExtDetail/nvtxExtImpl.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxExtDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx3/nvtxExtDetail/nvtxExtImpl.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxExtDetail/nvtxExtImpl.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxExtDetail/nvtxExtImpl.h [ 26%] Hipifying src/include/nvtx3/nvtxExtDetail/nvtxExtImplPayload_v1.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxExtDetail/nvtxExtImplPayload_v1.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxExtDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx3/nvtxExtDetail/nvtxExtImplPayload_v1.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxExtDetail/nvtxExtImplPayload_v1.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxExtDetail/nvtxExtImplPayload_v1.h [ 27%] Hipifying src/include/nvtx3/nvtxExtDetail/nvtxExtInit.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxExtDetail/nvtxExtInit.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxExtDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx3/nvtxExtDetail/nvtxExtInit.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxExtDetail/nvtxExtInit.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxExtDetail/nvtxExtInit.h [ 27%] Hipifying src/include/nvtx3/nvtxExtDetail/nvtxExtPayloadTypeInfo.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxExtDetail/nvtxExtPayloadTypeInfo.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxExtDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx3/nvtxExtDetail/nvtxExtPayloadTypeInfo.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxExtDetail/nvtxExtPayloadTypeInfo.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxExtDetail/nvtxExtPayloadTypeInfo.h [ 27%] Hipifying src/include/nvtx3/nvtxExtDetail/nvtxExtTypes.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxExtDetail/nvtxExtTypes.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxExtDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx3/nvtxExtDetail/nvtxExtTypes.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxExtDetail/nvtxExtTypes.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxExtDetail/nvtxExtTypes.h [ 27%] Hipifying src/include/nvtx_stub.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx_stub.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx_stub.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx_stub.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx_stub.h [ 27%] Hipifying src/include/p2p.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/p2p.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/p2p.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/p2p.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/p2p.h [ 28%] Hipifying src/include/param.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/param.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/param.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/param.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/param.h [ 28%] Hipifying src/include/profiler.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/profiler.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/profiler.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/profiler.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/profiler.h [ 28%] Hipifying src/include/proxy.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/proxy.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/proxy.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/proxy.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/proxy.h [ 28%] Hipifying src/include/rccl_float8.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/rccl_float8.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h [ 28%] Hipifying src/include/rccl_vars.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_vars.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/rccl_vars.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_vars.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_vars.h [ 29%] Hipifying src/include/rocm_smi_wrap.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rocm_smi_wrap.h [ 29%] Hipifying src/include/register.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/register.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/register.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/register.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/register.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/rocm_smi_wrap.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rocm_smi_wrap.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rocm_smi_wrap.h [ 29%] Hipifying src/include/rocmwrap.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rocmwrap.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/rocmwrap.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rocmwrap.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rocmwrap.h [ 30%] Hipifying src/include/roctx.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/roctx.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/roctx.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/roctx.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/roctx.h [ 30%] Hipifying src/include/shm.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/shm.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/shm.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/shm.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/shm.h [ 30%] Hipifying src/include/signals.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/signals.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/signals.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/signals.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/signals.h [ 30%] Hipifying src/include/socket.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/socket.h [ 31%] Hipifying src/include/strongstream.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/strongstream.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/strongstream.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/strongstream.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/strongstream.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/socket.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/socket.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/socket.h [ 31%] Hipifying src/include/timer.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/timer.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/timer.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/timer.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/timer.h [ 31%] Hipifying src/include/transport.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/transport.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h [ 32%] Hipifying src/include/trees.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/trees.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/trees.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/trees.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/trees.h [ 32%] Hipifying src/include/tuner.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/tuner.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/tuner.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/tuner.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/tuner.h [ 32%] Hipifying src/include/utils.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/utils.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h [ 33%] Hipifying src/init.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/init.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc [ 33%] Hipifying src/init_nvtx.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init_nvtx.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/init_nvtx.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init_nvtx.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init_nvtx.cc [ 34%] Hipifying src/misc/alt_rsmi.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/alt_rsmi.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc [ 34%] Hipifying src/misc/api_trace.c -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/api_trace.c mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/api_trace.c -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/api_trace.c && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/api_trace.c [ 35%] Hipifying src/misc/api_trace.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/api_trace.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/api_trace.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/api_trace.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/api_trace.cc [ 35%] Hipifying src/misc/archinfo.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/archinfo.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/archinfo.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/archinfo.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/archinfo.cc [ 35%] Hipifying src/misc/argcheck.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/argcheck.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/argcheck.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/argcheck.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/argcheck.cc [ 35%] Hipifying src/misc/ibvsymbols.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ibvsymbols.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/ibvsymbols.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ibvsymbols.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ibvsymbols.cc [ 35%] Hipifying src/misc/ibvwrap.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ibvwrap.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/ibvwrap.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ibvwrap.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ibvwrap.cc [ 35%] Hipifying src/misc/msccl/msccl_lifecycle.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc [ 35%] Hipifying src/misc/ipcsocket.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ipcsocket.cc [ 35%] Hipifying src/misc/msccl/msccl_parser.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/msccl/msccl_lifecycle.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/ipcsocket.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ipcsocket.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ipcsocket.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/msccl/msccl_parser.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc [ 36%] Hipifying src/misc/msccl/msccl_setup.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/msccl/msccl_setup.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc [ 36%] Hipifying src/misc/msccl/msccl_status.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_status.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/msccl/msccl_status.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_status.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_status.cc [ 37%] Hipifying src/misc/npkit.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/npkit.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/npkit.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/npkit.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/npkit.cc [ 37%] Hipifying src/misc/nvmlwrap_stub.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/nvmlwrap_stub.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/nvmlwrap_stub.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/nvmlwrap_stub.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/nvmlwrap_stub.cc [ 37%] Hipifying src/misc/param.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/param.cc [ 37%] Hipifying src/misc/profiler.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/profiler.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/param.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/param.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/param.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/profiler.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/profiler.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/profiler.cc [ 38%] Hipifying src/misc/rocm_smi_wrap.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/rocm_smi_wrap.cc [ 38%] Hipifying src/misc/rocmwrap.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/rocmwrap.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/rocm_smi_wrap.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/rocm_smi_wrap.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/rocm_smi_wrap.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/rocmwrap.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/rocmwrap.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/rocmwrap.cc [ 38%] Hipifying src/misc/roctx.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/roctx.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/roctx.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/roctx.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/roctx.cc [ 39%] Hipifying src/misc/shmutils.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/shmutils.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/shmutils.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/shmutils.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/shmutils.cc [ 39%] Hipifying src/misc/signals.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/signals.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/signals.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/signals.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/signals.cc [ 39%] Hipifying src/misc/socket.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/socket.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/socket.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/socket.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/socket.cc [ 39%] Hipifying src/misc/strongstream.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/strongstream.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/strongstream.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/strongstream.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/strongstream.cc [ 40%] Hipifying src/misc/tuner.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/tuner.cc [ 40%] Hipifying src/misc/utils.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/utils.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/utils.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/utils.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/utils.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/tuner.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/tuner.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/tuner.cc [ 40%] Hipifying src/msccl.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/msccl.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc [ 40%] Hipifying src/net.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/net.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/net.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/net.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/net.cc [ 41%] Hipifying src/proxy.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/proxy.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/proxy.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/proxy.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/proxy.cc [ 41%] Hipifying src/register.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/register.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/register.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/register.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/register.cc [ 41%] Hipifying src/transport.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/transport.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport.cc [ 41%] Hipifying src/transport/coll_net.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/transport/coll_net.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc [ 42%] Hipifying src/transport/net_ib.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_ib.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/transport/net_ib.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_ib.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_ib.cc [ 42%] Hipifying src/transport/net_socket.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_socket.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/transport/net_socket.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_socket.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_socket.cc [ 42%] Hipifying src/transport/net.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/transport/net.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc [ 42%] Hipifying src/transport/nvls.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/nvls.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/transport/nvls.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/nvls.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/nvls.cc [ 42%] Hipifying src/transport/p2p.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/p2p.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/transport/p2p.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/p2p.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/p2p.cc cd /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0 /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0 /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/CMakeFiles/rccl.dir/DependInfo.cmake "--color=" gmake[2]: Leaving directory '/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build' /usr/bin/gmake -f CMakeFiles/rccl.dir/build.make CMakeFiles/rccl.dir/build gmake[2]: Entering directory '/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build' [ 42%] Building CXX object CMakeFiles/rccl.dir/hipify/src/bootstrap.cc.o [ 42%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives.cc.o [ 42%] Building CXX object CMakeFiles/rccl.dir/hipify/src/enqueue.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/bootstrap.cc.o -MF CMakeFiles/rccl.dir/hipify/src/bootstrap.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/bootstrap.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/bootstrap.cc /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives.cc.o -MF CMakeFiles/rccl.dir/hipify/src/collectives.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/enqueue.cc.o -MF CMakeFiles/rccl.dir/hipify/src/enqueue.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/enqueue.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc [ 43%] Building CXX object CMakeFiles/rccl.dir/hipify/src/group.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/group.cc.o -MF CMakeFiles/rccl.dir/hipify/src/group.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/group.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/group.cc [ 44%] Building CXX object CMakeFiles/rccl.dir/hipify/src/channel.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/channel.cc.o -MF CMakeFiles/rccl.dir/hipify/src/channel.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/channel.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc [ 44%] Building CXX object CMakeFiles/rccl.dir/hipify/src/debug.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/debug.cc.o -MF CMakeFiles/rccl.dir/hipify/src/debug.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/debug.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/debug.cc In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/group.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/group.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/group.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/group.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/debug.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/group.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/group.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/group.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/group.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/bootstrap.cc:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/bootstrap.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/bootstrap.cc:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/bootstrap.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/bootstrap.cc:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/bootstrap.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/debug.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/bootstrap.cc:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/bootstrap.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/bootstrap.cc:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/bootstrap.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/bootstrap.cc:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/bootstrap.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ : warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/debug.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/bootstrap.cc:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/bootstrap.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/bootstrap.cc:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/bootstrap.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/group.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/group.cc:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:22:38: warning: unused variable 'AllGatherSchema' [-Wunused-variable] 22 | constexpr nvtxPayloadSchemaEntry_t AllGatherSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:25:10: warning: unused variable 'msgsize' [-Wunused-variable] 25 | size_t msgsize = sendcount * ncclTypeSize(datatype); | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:52:45: warning: unused variable 'AllReduceSchema' [-Wunused-variable] 52 | static constexpr nvtxPayloadSchemaEntry_t AllReduceSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:57:23: warning: unused variable 'payload' [-Wunused-variable] 57 | NvtxParamsAllReduce payload{count * ncclTypeSize(datatype), op}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:80:38: warning: unused variable 'AllToAllSchema' [-Wunused-variable] 80 | constexpr nvtxPayloadSchemaEntry_t AllToAllSchema[] = { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:83:10: warning: unused variable 'msgsize' [-Wunused-variable] 83 | size_t msgsize = count * ncclTypeSize(datatype); | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:128:38: warning: unused variable 'AllToAllvSchema' [-Wunused-variable] 128 | constexpr nvtxPayloadSchemaEntry_t AllToAllvSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:132:23: warning: unused variable 'payload' [-Wunused-variable] 132 | NvtxParamsAllToAllv payload{sendcounts[comm->rank] * ncclTypeSize(datatype), recvcounts[comm->rank] * ncclTyIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/debug.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ peSize(datatype)}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:173:38: warning: unused variable 'BroadcastSchema' [-Wunused-variable] 173 | constexpr nvtxPayloadSchemaEntry_t BroadcastSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:177:23: warning: unused variable 'payload' [-Wunused-variable] 177 | NvtxParamsBroadcast payload{count * ncclTypeSize(datatype), root}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/debug.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:210:40: warning: unused variable 'GatherSchema' [-Wunused-variable] 210 | constexpr nvtxPayloadSchemaEntry_t GatherSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:214:22: warning: unused variable 'payload' [-Wunused-variable] 214 | NvtxParamsGather payload{sendcount * ncclTypeSize(datatype), root}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:249:38: warning: unused variable 'ReduceSchema' [-Wunused-variable] 249 | constexpr nvtxPayloadSchemaEntry_t ReduceSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:255:20: warning: unused variable 'payload' [-Wunused-variable] 255 | NvtxParamsReduce payload{count * ncclTypeSize(datatype), root, op}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:281:38: warning: unused variable 'ReduceScatterSchema' [-Wunused-variable] 281 | constexpr nvtxPayloadSchemaEntry_t ReduceScatterSchema[] = { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:286:27: warning: unused variable 'payload' [-Wunused-variable] 286 | NvtxParamsReduceScatter payload{recvcount * ncclTypeSize(datatype), op}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/debug.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:312:40: warning: unused variable 'ScatterSchema' [-Wunused-variable] 312 | constexpr nvtxPayloadSchemaEntry_t ScatterSchema[] = { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:316:23: warning: unused variable 'payload' [-Wunused-variable] 316 | NvtxParamsScatter payload{recvcount * ncclTypeSize(datatype), root}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/debug.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:356:22: warning: unused variable 'payload' [-Wunused-variable] 356 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:381:22: warning: unused variable 'payload' [-Wunused-variable] 381 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/debug.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for host. 1 warning generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:10: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:345:42: warning: unused variable 'SendRecvSchema' [-Wunused-const-variable] 345 | constexpr const nvtxPayloadSchemaEntry_t SendRecvSchema[] = { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/bootstrap.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/bootstrap.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/bootstrap.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:22:38: warning: unused variable 'AllGatherSchema' [-Wunused-variable] 22 | constexpr nvtxPayloadSchemaEntry_t AllGatherSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:25:10: warning: unused variable 'msgsize' [-Wunused-variable] 25 | size_t msgsize = sendcount * ncclTypeSize(datatype); | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:52:45: warning: unused variable 'AllReduceSchema' [-Wunused-variable] 52 | static constexpr nvtxPayloadSchemaEntry_t AllReduceSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:57:23: warning: unused variable 'payload' [-Wunused-variable] 57 | NvtxParamsAllReduce payload{count * ncclTypeSize(datatype), op}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:22:38: warning: unused variable 'AllGatherSchema' [-Wunused-variable] 22 | con/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:22:38: warning: unused variable 'AllGatherSchema' [-Wunused-variable] 22 | constexpr nvtxPayloadSchemaEntry_t AllGatherSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:25:10: warning: unused variable 'msgsize' [-Wunused-variable] 25 | size_t msgsize = sendcount * ncclTypeSize(datatype); | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:80:38: warning: unused variable 'AllToAllSchema' [-Wunused-variable] 80 | constexpr nvtxPayloadSchemaEntry_t AllToAllSchema[] = { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:83:10: warning: unused variable 'msgsize' [-Wunused-variable] 83 | size_t msgsize = count * ncclTypeSize(datatype); | ^~~~~~~ stexpr nvtxPayloadSchemaEntry_t AllGatherSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:25:10: warning: unused variable 'msgsize' [-Wunused-variable] 25 | size_t msgsize = sendcount * ncclTypeSize(datatype); | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:52:45: warning: unused variable 'AllReduceSchema' [-Wunused-variable] 52 | static constexpr nvtxPayloadSchemaEntry_t AllReduceSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:57:23: warning: unused variable 'payload' [-Wunused-variable] 57 | NvtxParamsAllReduce payload{count * ncclTypeSize(datatype), op}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:128:38: warning: unused variable 'AllToAllvSchema' [-Wunused-variable] 128 | constexpr nvtxPayloadSchemaEntry_t AllToAllvSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:132:23: warning: unused variable 'payload' [-Wunused-variable] 132 | NvtxParamsAllToAllv payload{sendcounts[comm->rank] * ncclTypeSize(datatype), recvcounts[comm->rank] * ncclTypeSize(datatype)}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:173:38: warning: unused variable 'BroadcastSchema' [-Wunused-variable] 173 | constexpr nvtxPayloadSchemaEntry_t BroadcastSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:177:23: warning: unused variable 'payload' [-Wunused-variable] 177 | NvtxParamsBroadcast payload{count * ncclTypeSize(datatype), root}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/group.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/group.cc:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:80:38: warning: unused variable 'AllToAllSchema' [-Wunused-variable] 80 | constexpr nvtxPayloadSchemaEntry_t AllToAllSchema[] = { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:83:10: warning: unused variable 'msgsize' [-Wunused-variable] 83 | size_t msgsize = count * ncclTypeSize(datatype); | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:7: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(stru/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.ccct n:c128c:l38C:o mwarning: m*unused variable 'AllToAllvSchema' [-Wunused-variable] comm, int peer, int c128h | a n nceolnIsntce,x pirn tn vctoxlPla,y lionatd*ScchhaenmnaeElnItdr)y _{t A| l ^~~~~~~~~~~~~~~~~~l ToAllvSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:132:In file included from 23/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:: 9warning: : unused variable 'payload' [-Wunused-variable]/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h: 161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | s132t | a t iNcv tgxdPra_rta mnscAclllGTdorAIlnlivt (p)a y{l o a| d ^~~~~~~~~~~{ sendcou/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.hn:t209s:[21c:o mwarning: munused function 'ncclGdrCudaFree' [-Wunused-function]- >rank] * nc c209l | TsytpaetSiicz en(cdcaltRaetsyuplet)_,t rnecccvlcGodurnCtusd[acFormeme-(>vroaindk*] g*d rnHcacnldTlyep)e S{i z e| ( ^~~~~~~~~~~~~~~d atatype)}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:210:40: warning: unused variable 'GatherSchema' [-Wunused-variable] 210 | constexpr nvtxPayloadSchemaEntry_t GatherSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:214:22: warning: unused variable 'payload' [-Wunused-variable] 214 | NvtxParamsGather payload{sendcount * ncclTypeSize(datatype), root}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:249:38: warning: unused variable 'ReduceSchema' [-Wunused-variable] 249 | constexpr nvtxPayloadSchemaEntry_t ReduceSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:255:20: warning: unused variable 'payload' [-Wunused-variable] 255 | NvtxParamsReduce payload{count * ncc/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:52:45: warning: unused variable 'AllReduceSchema' [-Wunused-variable] 52 | static constexpr nvtxPayloadSchemaEntry_t AllReduceSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:57:23: warning: unused variable 'payload' [-Wunused-variable] 57 | NvtxParamsAllReduce payload{count * ncclTypeSize(datatype), op}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:173:38: warning: unused variable 'BroadcastSchema' [-Wunused-variable] 173 | constexpr nvtxPayloadSchemaEntry_t BroadcastSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:177:23: warning: unused variable 'payload' [-Wunused-variable] 177 | NvtxParamsBroadcast payload{count * ncclTypeSize(datatype), root}; | ^~~~~~~ lTypeSize(datatype), root, op}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:281:38: warning: unused variable 'ReduceScatterSchema' [-Wunused-variable] 281 | constexpr nvtxPayloadSchemaEntry_t ReduceScatterSchema[] = { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:286:27: warning: unused variable 'payload' [-Wunused-variable] 286 | NvtxParamsReduceScatter payload{recvcount * ncclTypeSize(datatype), op}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:80:38: warning: unused variable 'AllToAllSchema' [-Wunused-variable] 80 | constexpr nvtxPayloadSchemaEntry_t AllToAllSchema[] = { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:83:10: warning: unused variable 'msgsize' [-Wunused-variable] 83 | size_t msgsize = count * ncclTypeSize(datatype); | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:312:40: warning: unused variable 'ScatterSchema' [-Wunused-variable] 312 | constexpr nvtxPayloadSchemaEntry_t ScatterSchema[] = { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:316:23: warning: unused variable 'payload' [-Wunused-variable] 316 | NvtxParamsScatter payload{recvcount * ncclTypeSize(datatype), root}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:210:40: warning: unused variable 'GatherSchema' [-Wunused-variable] 210 | constexpr nvtxPayloadSchemaEntry_t GatherSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:214:22: warning: unused variable 'payload' [-Wunused-variable] 214 | NvtxParamsGather payload{sendcount * ncclTypeSize(datatype), root}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/bootstrap.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:249:38: warning: unused variable 'ReduceSchema' [-Wunused-variable] 249 | constexpr nvtxPayloadSchemaEntry_t ReduceSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:255:20: warning: unused variable 'payload' [-Wunused-variable] 255 | NvtxParamsReduce payload{count * ncclTypeSize(datatype), root, op}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/bootstrap.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:356:22: warning: unused variable 'payload' [-Wunused-variable] 356 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:281:38: warning: unused variable 'ReduceScatterSchema' [-Wunused-variable] 281 | constexpr nvtxPayloadSchemaEntry_t ReduceScatterSchema[] = { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:286:27: warning: unused variable 'payload' [-Wunused-variable] 286 | NvtxParamsReduceScatter payload{recvcount * ncclTypeSize(datatype), op}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:128:38: warning: unused variable 'AllToAllvSchema' [-Wunused-variable] 128 | constexpr nvtxPayloadSchemaEntry_t AllToAllvSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:132:23: warning: unused variable 'payload' [-Wunused-variable] 132 | NvtxParamsAllToAllv payload{sendcounts[comm->rank] * ncclTypeSize(datatype), recvcounts[comm->rank] * ncclTypeSize(datatype)}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:381:22: warning: unused variable 'payload' [-Wunused-variable] 381 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ 3 warnings generated when compiling for gfx1201. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:312:40: warning: unused variable 'ScatterSchema' [-Wunused-variable] 312 | constexpr nvtxPayloadSchemaEntry_t ScatterSchema[] = { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:316:23: warning: unused variable 'payload' [-Wunused-variable] 316 | NvtxParamsScatter payload{recvcount * ncclTypeSize(datatype), root}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/bootstrap.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:173:38: warning: unused variable 'BroadcastSchema' [-Wunused-variable] 173 | constexpr nvtxPayloadSchemaEntry_t BroadcastSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:177:23: warning: unused variable 'payload' [-Wunused-variable] 177 | NvtxParamsBroadcast payload{count * ncclTypeSize(datatype), root}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/bootstrap.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:22:38: warning: unused variable 'AllGatherSchema' [-Wunused-variable] 22 | constexpr nvtxPayloadSchemaEntry_t AllGatherSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:25:10: warning: unused variable 'msgsize' [-Wunused-variable] 25 | size_t msgsize = sendcount * ncclTypeSize(datatype); | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:52:45: warning: unused variable 'AllReduceSchema' [-Wunused-variable] 52 | static constexpr nvtxPayloadSchemaEntry_t AllReduceSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:57:23: warning: unused variable 'payload' [-Wunused-variable] 57 | NvtxParamsAllReduce payload{count * ncclTypeSize(datatype), op}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:356:22: warning: unused variable 'payload' [-Wunused-variable] 356 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:210:40: warning: unused variable 'GatherSchema' [-Wunused-variable] 210 | constexpr nvtxPayloadSchemaEntry_t GatherSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:214:22: warning: unused variable 'payload' [-Wunused-variable] 214 | NvtxParamsGather payload{sendcount * ncclTypeSize(datatype), root}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:22:38: warning: unused variable 'AllGatherSchema' [-Wunused-variable] 22 | constexpr nvtxPayloadSchemaEntry_t AllGatherSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:25:10: warning: unused variable 'msgsize' [-Wunused-variable] 25 | size_t msgsize = sendcount * ncclTypeSize(datatype); | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:381:22: warning: unused variable 'payload' [-Wunused-variable] 381 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:80:38: warning: unused variable 'AllToAllSchema' [-Wunused-variable] 80 | constexpr nvtxPayloadSchemaEntry_t AllToAllSchema[] = { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:83:10: warning: unused variable 'msgsize' [-Wunused-variable] 83 | size_t msgsize = count * ncclTypeSize(datatype); | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/bootstrap.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:52:45: warning: unused variable 'AllReduceSchema' [-Wunused-variable] 52 | static constexpr nvtxPayloadSchemaEntry_t AllReduceSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:57:23: warning: unused variable 'payload' [-Wunused-variable] 57 | NvtxParamsAllReduce payload{count * ncclTypeSize(datatype), op}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:249:38: warning: unused variable 'ReduceSchema' [-Wunused-variable] 249 | constexpr nvtxPayloadSchemaEntry_t ReduceSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:255:20: warning: unused variable 'payload' [-Wunused-variable] 255 | NvtxParamsReduce payload{count * ncclTypeSize(datatype), root, op}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/group.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/group.cc:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int col/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:128:38: warning: unused variable 'AllToAllvSchema' [-Wunused-variable] 128 | constexpr nvtxPayloadSchemaEntry_t AllToAllvSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:132:23: warning: unused variable 'payload' [-Wunused-variable] 132 | NvtxParamsAllToAllv payload{sendcounts[comm->rank] * ncclTypeSize(datatype), recvcounts[comm->rank] * ncclTypeSize(datatype)}; | ^~~~~~~ l, int*channelId) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:80:38: warning: unused variable 'AllToAllSchema' [-Wunused-variable] 80 | constexpr nvtxPayloadSchemaEntry_t AllToAllSchema[] = { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:83:10: warning: unused variable 'msgsize' [-Wunused-variable] 83 | size_t msgsize = count * ncclTypeSize(datatype); | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:281:38: warning: unused variable 'ReduceScatterSchema' [-Wunused-variable] 281 | constexpr nvtxPayloadSchemaEntry_t ReduceScatterSchema[] = { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:286:27: warning: unused variable 'payload' [-Wunused-variable] 286 | NvtxParamsReduceScatter payload{recvcount * ncclTypeSize(datatype), op}; | ^~~~~~~ 1 warning generated when compiling for gfx1201. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:173:38: warning: unused variable 'BroadcastSchema' [-Wunused-variable] 173 | constexpr nvtxPayloadSchemaEntry_t BroadcastSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:177:23: warning: unused variable 'payload' [-Wunused-variable] 177 | NvtxParamsBroadcast payload{count * ncclTypeSize(datatype), root}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:128:38: warning: unused variable 'AllToAllvSchema' [-Wunused-variable] 128 | constexpr nvtxPayloadSchemaEntry_t AllToAllvSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:132:23: warning: unused variable 'payload' [-Wunused-variable] 132 | NvtxParamsAllToAllv payload{sendcounts[comm->rank] * ncclTypeSize(datatype), recvcounts[comm->rank] * ncclTypeSize(datatype)}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:173:38: warning: unused variable 'BroadcastSchema' [-Wunused-variable] 173 | constexpr nvtxPayloadSchemaEntry_t BroadcastSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:177:23: warning: unused variable 'payload' [-Wunused-variable] 177 | NvtxParamsBroadcast payload{count * ncclTypeSize(datatype), root}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:312:40: warning: unused variable 'ScatterSchema' [-Wunused-variable] 312 | constexpr nvtxPayloadSchemaEntry_t ScatterSchema[] = { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:316:23: warning: unused variable 'payload' [-Wunused-variable] 316 | NvtxParamsScatter payload{recvcount * ncclTypeSize(datatype), root}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:210:40: warning: unused variable 'GatherSchema' [-Wunused-variable] 210 | constexpr nvtxPayloadSchemaEntry_t GatherSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:214:22: warning: unused variable 'payload' [-Wunused-variable] 214 | NvtxParamsGather payload{sendcount * ncclTypeSize(datatype), root}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:249:38: warning: unused variable 'ReduceSchema' [-Wunused-variable] 249 | constexpr nvtxPayloadSchemaEntry_t ReduceSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:255:20: warning: unused variable 'payload' [-Wunused-variable] 255 | NvtxParamsReduce payload{count * ncclTypeSize(datatype), root, op}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:210:40: warning: unused variable 'GatherSchema' [-Wunused-variable] 210 | constexpr nvtxPayloadSchemaEntry_t GatherSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:281:38: warning: unused variable 'ReduceScatterSchema' [-Wunused-variable] 281 | constexpr nvtxPayloadSchemaEntry_t ReduceScatterSchema[] = { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:286:27: warning: unused variable 'payload' [-Wunused-variable] 286 | NvtxParamsReduceScatter payload{recvcount * ncclTypeSize(datatype), op}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:214:22: warning: unused variable 'payload' [-Wunused-variable] 214 | NvtxParamsGather payload{sendcount * ncclTypeSize(datatype), root}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:356:22: warning: unused variable 'payload' [-Wunused-variable] 356 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:249:38: warning: unused variable 'ReduceSchema' [-Wunused-variable] 249 | constexpr nvtxPayloadSchemaEntry_t ReduceSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:255:20: warning: unused variable 'payload' [-Wunused-variable] 255 | NvtxParamsReduce payload{count * ncclTypeSize(datatype), root, op}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:281:38: warning: unused variable 'ReduceScatterSchema' [-Wunused-variable] 281 | constexpr nvtxPayloadSchemaEntry_t ReduceScatterSchema[] = { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:286:27: warning: unused variable 'payload' [-Wunused-variable] 286 | NvtxParamsReduceScatter payload{recvcount * ncclTypeSize(datatype), op}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:312:40: warning: unused variable 'ScatterSchema' [-Wunused-variable] 312 | constexpr nvtxPayloadSchemaEntry_t ScatterSchema[] = { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:316:23: warning: unused variable 'payload' [-Wunused-variable] 316 | NvtxParamsScatter payload{recvcount * ncclTypeSize(datatype), root}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:381:22: warning: unused variable 'payload' [-Wunused-variable] 381 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:312:40: warning: unused variable 'ScatterSchema' [-Wunused-variable] 312 | constexpr nvtxPayloadSchemaEntry_t ScatterSchema[] = { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:316:23: warning: unused variable 'payload' [-Wunused-variable] 316 | NvtxParamsScatter payload{recvcount * ncclTypeSize(datatype), root}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:356:22: warning: unused variable 'payload' [-Wunused-variable] 356 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:381:22: warning: unused variable 'payload' [-Wunused-variable] 381 | NvtxParamsSendRecv payloa/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:356:22: warning: unused variable 'payload' [-Wunused-variable] 356 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ d{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:381:22: warning: unused variable 'payload' [-Wunused-variable] 381 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/group.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/group.cc:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ 1 warning generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:10: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:345:42: warning: unused variable 'SendRecvSchema' [-Wunused-const-variable] 345 | constexpr const nvtxPayloadSchemaEntry_t SendRecvSchema[] = { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:10: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:345:42: warning: unused variable 'SendRecvSchema' [-Wunused-const-variable] 345 | constexpr const nvtxPayloadSchemaEntry_t SendRecvSchema[] = { | ^~~~~~~~~~~~~~ 31/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:22:38: warning: unused variable 'AllGatherSchema' [-Wunused-variable] 22 | constexpr nvtxPayloadSchemaEntry_t AllGatherSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:25:10: warning: unused variable 'msgsize' [-Wunused-variable] 25 | size_t msgsize = sendcount * ncclTypeSize(datatype); | ^~~~~~~ warnings generated when compiling for gfx1102. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:52:45: warning: unused variable 'AllReduceSchema' [-Wunused-variable] 52 | static constexpr nvtxPayloadSchemaEntry_t AllReduceSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:57:23: warning: unused variable 'payload' [-Wunused-variable] 57 | NvtxParamsAllReduce payload{count * ncclTypeSize(datatype), op}; | ^~~~~~~ 1 warning generated when compiling for gfx1101. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:80:38: warning: unused variable 'AllToAllSchema' [-Wunused-variable] 80 | constexpr nvtxPayloadSchemaEntry_t AllToAllSchema[] = { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:83:10: warning: unused variable 'msgsize' [-Wunused-variable] 83 | size_t msgsize = count * ncclTypeSize(datatype); | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/group.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/group.cc:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:128:38: warning: unused variable 'AllToAllvSchema' [-Wunused-variable] 128 | constexpr nvtxPayloadSchemaEntry_t AllToAllvSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:132:23: warning: unused variable 'payload' [-Wunused-variable] 132 | NvtxParamsAllToAllv payload{sendcounts[comm->rank] * ncclTypeSize(datatype), recvcounts[comm->rank] * ncclTypeSize(datatype)}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:173:38: warning: unused variable 'BroadcastSchema' [-Wunused-variable] 173 | constexpr nvtxPayloadSchemaEntry_t BroadcastSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:177:23: warning: unused variable 'payload' [-Wunused-variable] 177 | NvtxParamsBroadcast payload{count * ncclTypeSize(datatype), root}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:22:38: warning: unused variable 'AllGatherSchema' [-Wunused-variable] 22 | constexpr nvtxPayloadSchemaEntry_t AllGatherSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:25:10: warning: unused variable 'msgsize' [-Wunused-variable] 25 | size_t msgsize = sendcount * ncclTypeSize(datatype); | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:52:45: warning: unused variable 'AllReduceSchema' [-Wunused-variable] 52 | static constexpr nvtxPayloadSchemaEntry_t AllReduceSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:57:23: warning: unused variable 'payload' [-Wunused-variable] 57 | NvtxParamsAllReduce payload{count * ncclTypeSize(datatype), op}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:10: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:345:42: warning: unused variable 'SendRecvSchema' [-Wunused-const-variable] 345 | constexpr const nvtxPayloadSchemaEntry_t SendRecvSchema[] = { | ^~~~~~~~~~~~~~ 1 warning generated when compiling for gfx1102. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:210:40: warning: unused variable 'GatherSchema' [-Wunused-variable] 210 | constexpr nvtxPayloadSchemaEntry_t GatherSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:214:22: warning: unused variable 'payload' [-Wunused-variable] 214 | NvtxParamsGather payload{sendcount * ncclTypeSize(datatype), root}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:10: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.ccint:*249 :i38n:d exwarning: )unused variable 'ReduceSchema' [-Wunused-variable] { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function]249 | constexpr nvt x222P | asytlaotaidcS cnhcecmlaREensturlyt__tt RnecdculcTeoSpcohReamnak[T]o I=n d{e x (| s ^~~~~~~~~~~~t ruct n/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.ccc:c255l:T20o:p owarning: Sunused variable 'payload' [-Wunused-variable]y stem* syste m255, | i nNtv trxaPnakr,a misnRte*d uicned epxa)y l{o a d| { ^~~~~~~~~~~~~~~~~~~c ount/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h :*233 :n21c:c lwarning: Tunused function 'ncclTopoDevToRank' [-Wunused-function]y peSize(datatype )233, | srtoaotti,c onpc}c;l R e| s ^~~~~~~u lt_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:345:42: warning: unused variable 'SendRecvSchema' [-Wunused-const-variable] 345 | constexpr const nvtxPayloadSchemaEntry_t SendRecvSchema[] = { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:281:38: warning: unused variable 'ReduceScatterSchema' [-Wunused-variable] 281 | constexpr nvtxPayloadSchemaEntr/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:80:38: warning: unused variable 'AllToAllSchema' [-Wunused-variable] 80 | constexpr nvtxPayloadSchemaEntry_t AllToAllSchema[] = { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:83:10: warning: unused variable 'msgsize' [-Wunused-variable] 83 | size_t msgsize = count * ncclTypeSize(datatype); | ^~~~~~~ y_t ReduceScatterSchema[] = { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:286:27: warning: unused variable 'payload' [-Wunused-variable] 286 | NvtxParamsReduceScatter payload{recvcount * ncclTypeSize(datatype), op}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:312:40: warning: unused variable 'ScatterSchema' [-Wunused-variable] 312 | constexpr nvtxPayloadSchemaEntry_t ScatterSchema[] = { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:316:23: warning: unused variable 'payload' [-Wunused-variable] 316 | NvtxParamsScatter payload{recvcount * ncclTypeSize(datatype), root}In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:10: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:345:42: warning: unused variable 'SendRecvSchema' [-Wunused-const-variable] 345 | constexpr const nvtxPayloadSchemaEntry_t SendRecvSchema[] = { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:128:38: warning: unused variable 'AllToAllvSchema' [-Wunused-variable] 128 | constexpr nvtxPayloadSchemaEntry_t AllToAllvSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:132:23: warning: unused variable 'payload' [-Wunused-variable] 132 | NvtxParamsAllToAllv payload{sendcounts[comm->rank] * ncclTypeSize(datatype), recvcounts[comm->rank] * ncclTypeSize(datatype)}; | ^~~~~~~ ; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:356:22: warning: unused variable 'payload' [-Wunused-variable] 356 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:173:38: warning: unused variable 'BroadcastSchema' [-Wunused-variable] 173 | constexpr nvtxPayloadSchemaEntry_t BroadcastSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:177:23: warning: unused variable 'payload' [-Wunused-variable] 177 | NvtxParamsBroadcast payload{count * ncclTypeSize(datatype), root}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:381:22: warning: unused variable 'payload' [-Wunused-variable] 381 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:210:40: warning: unused variable 'GatherSchema' [-Wunused-variable] 210 | constexpr nvtxPayloadSchemaEntry_t GatherSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:214:22: warning: unused variable 'payload' [-Wunused-variable] 214 | NvtxParamsGather payload{sendcount * ncclTypeSize(datatype), root}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:249:38: warning: unused variable 'ReduceSchema' [-Wunused-variable] 249 | constexpr nvtxPayloadSchemaEntry_t ReduceSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:255:20: warning: unused variable 'payload' [-Wunused-variable] 255 | NvtxParamsReduce payload{count * ncclTypeSize(datatype), root, op}; | ^~~~~~~ 1 warning generated when compiling for gfx1100. 2 warnings generated when compiling for gfx1200. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:281:38: warning: unused variable 'ReduceScatterSchema' [-Wunused-variable] 281 | constexpr nvtxPayloadSchemaEntry_t ReduceScatterSchema[] = { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:286:27: warning: unused variable 'payload' [-Wunused-variable] 286 | NvtxParamsReduceScatter payload{recvcount * ncclTypeSize(datatype), op}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:312:40: warning: unused variable 'ScatterSchema' [-Wunused-variable] 312 | constexpr nvtxPayloadSchemaEntry_t ScatterSchema[] = { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:316:23: warning: unused variable 'payload' [-Wunused-variable] 316 | NvtxParamsScatter payload{recvcount * ncclTypeSize(datatype), root}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/group.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/group.cc:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/group.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/group.cc:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:356:22: warning: unused variable 'payload' [-Wunused-variable] 356 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ 1 warning generated when compiling for gfx1200. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:381:22: warning: unused variable 'payload' [-Wunused-variable] 381 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/group.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/group.cc:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:10: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:345:42: warning: unused variable 'SendRecvSchema' [-Wunused-const-variable] 345 | constexpr const nvtxPayloadSchemaEntry_t SendRecvSchema[] = { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:10: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:345:42: warning: unused variable 'SendRecvSchema' [-Wunused-const-variable] 345 | constexpr const nvtxPayloadSchemaEntry_t SendRecvSchema[] = { | ^~~~~~~~~~~~~~ [ 44%] Building CXX object CMakeFiles/rccl.dir/hipify/src/init.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/init.cc.o -MF CMakeFiles/rccl.dir/hipify/src/init.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/init.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc 2 warnings generated when compiling for gfx90a. 2 warnings generated when compiling for gfx1201. 2 warnings generated when compiling for gfx90a. 2 warnings generated when compiling for gfx1101. 3 warnings generated when compiling for gfx90a. 2 warnings generated when compiling for gfx1102. 2 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:15: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ 3 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for host. 3 warnings generated when compiling for gfx1102. 31 warnings generated when compiling for gfx90a. 31 warnings generated when compiling for gfx1100. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:100:5: warning: unused label 'ignore0' [-Wunused-label] 100 | ignore0:; | ^~~~~~~~ 31 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 17231 | warnings generated when compiling for gfx1201. void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ 3 warnings generated when compiling for gfx1101. 3 warnings generated when compiling for gfx1200. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:399:7: warning: variable 'rnChannels' set but not used [-Wunused-but-set-variable] 399 | int rnChannels = 0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:506:7: warning: variable 'rnChannel' set but not used [-Wunused-but-set-variable] 506 | int rnChannel = 0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:610:34: warning: suggest braces around initialization of subobject [-Wmissing-braces] 610 | struct ncclWorkElemP2p elem = {0}; | ^ | {} In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ 31 warnings generated when compiling for host. 31 warnings generated when compiling for gfx1101. 3 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ 31 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:7: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:15: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ Compute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:209:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 209 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:15: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:7: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:209:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 209 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:15: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ 3 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:15: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:15: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:100:5: warning: unused label 'ignore0' [-Wunused-label] 100 | ignore0:; | ^~~~~~~~ [ 44%] Building CXX object CMakeFiles/rccl.dir/hipify/src/init_nvtx.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/init_nvtx.cc.o -MF CMakeFiles/rccl.dir/hipify/src/init_nvtx.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/init_nvtx.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init_nvtx.cc In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:7: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:209:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 209 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:100:5: warning: unused label 'ignore0' [-Wunused-label] 100 | ignore0:; | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:100:5: warning: unused label 'ignore0' [-Wunused-label] 100 | ignore0:; | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:100:5: warning: unused label 'ignore0' [-Wunused-label] 100 | ignore0:; | ^~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:7: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:209:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 209 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:399:7: warning: variable 'rnChannels' set but not used [-Wunused-but-set-variable] 399 | int rnChannels = 0; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:7: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:209:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 209 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc[ 44%] Building CXX object CMakeFiles/rccl.dir/hipify/src/net.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/net.cc.o -MF CMakeFiles/rccl.dir/hipify/src/net.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/net.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/net.cc :399:7: warning: variable 'rnChannels' set but not used [-Wunused-but-set-variable] 399 | int rnChannels = 0; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:7: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:209:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 209 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:506:7: warning: variable 'rnChannel' set but not used [-Wunused-but-set-variable] 506 | int rnChannel = 0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:399:7: warning: variable 'rnChannels' set but not used [-Wunused-but-set-variable] 399 | int rnChannels = 0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:610:34: warning: suggest braces around initialization of subobject [-Wmissing-braces] 610 | struct ncclWorkElemP2p elem = {0}; | ^ | {} /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:399:7: warning: variable 'rnChannels' set but not used [-Wunused-but-set-variable] 399 | int rnChannels = 0; | ^ :506:7: warning: variable 'rnChannel' set but not used [-Wunused-but-set-variable] 506 | int rnChannel = 0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:506:7: warning: variable 'rnChannel' set but not used [-Wunused-but-set-variable] 506 | int rnChannel = 0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:610:34: warning: suggest braces around initialization of subobject [-Wmissing-braces] 610 | struct ncclWorkElemP2p elem = {0}; | ^ | {} :610:34: warning: suggest braces around initialization of subobject [-Wmissing-braces] 610 | struct ncclWorkElemP2p elem = {0}; | ^ | {} /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:100:5: warning: unused label 'ignore0' [-Wunused-label] 100 | ignore0:; | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:506:7: warning: variable 'rnChannel' set but not used [-Wunused-but-set-variable] 506 | int rnChannel = 0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:610:34: warning: suggest braces around initialization of subobject [-Wmissing-braces] 610 | struct ncclWorkElemP2p elem = {0}; | ^ | {} In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:15: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:15: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:7: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:209:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 209 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:399:7: warning: variable 'rnChannels' set but not used [-Wunused-but-set-variable] 399 | int rnChannels = 0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:506:7: warning: variable 'rnChannel' set but not used [-Wunused-but-set-variable] 506 | int rnChannel = 0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:610:34: warning: suggest braces around initialization of subobject [-Wmissing-braces] 610 | struct ncclWorkElemP2p elem = {0}; | ^ | {} /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:100:5: warning: unused label 'ignore0' [-Wunused-label] 100 | ignore0:; | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:100:5: warning: unused label 'ignore0' [-Wunused-label] 100 | ignore0:; | ^~~~~~~~ 9 warnings generated when compiling for gfx1100. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc::399399::77:: warning: warning: variable 'rnChannels' set but not used [-Wunused-but-set-variable]variable 'rnChannels' set but not used [-Wunused-but-set-variable] 399399 | | iinntt rrnnCChhaannnneellss == 00;; | | ^ ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:506:7: warning: variable 'rnChannel' set but not used [-Wunused-but-set-variable] 506 | int rnChannel = 0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:506:7: warning: variable 'rnChannel' set but not used [-Wunused-but-set-variable] 506 | int rnChannel = 0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:610:34: warning: suggest braces around initialization of subobject [-Wmissing-braces] 610 | struct ncclWorkElemP2p elem = {0}; | ^ | {} /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:610:34: warning: suggest braces around initialization of subobject [-Wmissing-braces] 610 | struct ncclWorkElemP2p elem = {0}; | ^ | {} 2 warnings generated when compiling for host. 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1102. [ 45%] Building CXX object CMakeFiles/rccl.dir/hipify/src/msccl.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/msccl.cc.o -MF CMakeFiles/rccl.dir/hipify/src/msccl.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/msccl.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:11: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:15: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:209:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 209 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:47:21: warning: unused function 'computeColl' [-Wunused-function] 47 | static ncclResult_t computeColl(struct ncclInfo* info /* input */, int* workFuncIndex, struct ncclWorkElem* work, struct ncclProxyOp* proxyOp /* output */); | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:61:21: warning: unused function 'getLoopInfo' [-Wunused-function] 61 | static ncclResult_t getLoopInfo(struct ncclInfo* collInfo); | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:794:21: warning: unused function 'getCBDCollnChannel' [-Wunused-function] 794 | static ncclResult_t getCBDCollnChannel(struct ncclKernelPlan* plan, struct ncclInfo* collInfo, int usableChannels) { | ^~~~~~~~~~~~~~~~~~ 9 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:11: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:15: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:209:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 209 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:47:21: warning: unused function 'computeColl' [-Wunused-function] 47 | static ncclResult_t computeColl(struct ncclInfo* info /* input */, int* workFuncIndex, struct ncclWorkElem* work, struct ncclProxyOp* proxyOp /* output */); | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:61:21: warning: unused function 'getLoopInfo' [-Wunused-function] 61 | static ncclResult_t getLoopInfo(struct ncclInfo* collInfo); | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:794:21: warning: unused function 'getCBDCollnChannel' [-Wunused-function] 794 | static ncclResult_t getCBDCollnChannel(struct ncclKernelPlan* plan, struct ncclInfo* collInfo, int usableChannels) { | ^~~~~~~~~~~~~~~~~~ [ 45%] Building CXX object CMakeFiles/rccl.dir/hipify/src/proxy.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/proxy.cc.o -MF CMakeFiles/rccl.dir/hipify/src/proxy.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/proxy.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/proxy.cc In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:11: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:15: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:209:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 209 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:47:21: warning: unused function 'computeColl' [-Wunused-function] 47 | static ncclResult_t computeColl(struct ncclInfo* info /* input */, int* workFuncIndex, struct ncclWorkElem* work, struct ncclProxyOp* proxyOp /* output */); | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:61:21: warning: unused function 'getLoopInfo' [-Wunused-function] 61 | static ncclResult_t getLoopInfo(struct ncclInfo* collInfo); | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:794:21: warning: unused function 'getCBDCollnChannel' [-Wunused-function] 794 | static ncclResult_t getCBDCollnChannel(struct ncclKernelPlan* plan, struct ncclInfo* collInfo, int usableChannels) { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:11: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:15: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:209:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 209 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:47:21: warning: unused function 'computeColl' [-Wunused-function] 47 | static ncclResult_t computeColl(struct ncclInfo* info /* input */, int* workFuncIndex, struct ncclWorkElem* work, struct ncclProxyOp* proxyOp /* output */); | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:61:21: warning: unused function 'getLoopInfo' [-Wunused-function] 61 | static ncclResult_t getLoopInfo(struct ncclInfo* collInfo); | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:794:21: warning: unused function 'getCBDCollnChannel' [-Wunused-function] 794 | static ncclResult_t getCBDCollnChannel(struct ncclKernelPlan* plan, struct ncclInfo* collInfo, int usableChannels) { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:11: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:15: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:209:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 209 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:47:21: warning: unused function 'computeColl' [-Wunused-function] 47 | static ncclResult_t computeColl(struct ncclInfo* info /* input */, int* workFuncIndex, struct ncclWorkElem* work, struct ncclProxyOp* proxyOp /* output */); | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:61:21: warning: unused function 'getLoopInfo' [-Wunused-function] 61 | static ncclResult_t getLoopInfo(struct ncclInfo* collInfo); | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:794:21: warning: unused function 'getCBDCollnChannel' [-Wunused-function] 794 | static ncclResult_t getCBDCollnChannel(struct ncclKernelPlan* plan, struct ncclInfo* collInfo, int usableChannels) { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:11: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:15: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:209:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 209 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:47:21: warning: unused function 'computeColl' [-Wunused-function] 47 | static ncclResult_t computeColl(struct ncclInfo* info /* input */, int* workFuncIndex, struct ncclWorkElem* work, struct ncclProxyOp* proxyOp /* output */); | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:61:21: warning: unused function 'getLoopInfo' [-Wunused-function] 61 | static ncclResult_t getLoopInfo(struct ncclInfo* collInfo); | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:794:21: warning: unused function 'getCBDCollnChannel' [-Wunused-function] 794 | static ncclResult_t getCBDCollnChannel(struct ncclKernelPlan* plan, struct ncclInfo* collInfo, int usableChannels) { | ^~~~~~~~~~~~~~~~~~ 37 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:11: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:15: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:209:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 209 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:47:21: warning: unused function 'computeColl' [-Wunused-function] 47 | static ncclResult_t computeColl(struct ncclInfo* info /* input */, int* workFuncIndex, struct ncclWorkElem* work, struct ncclProxyOp* proxyOp /* output */); | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:61:21: warning: unused function 'getLoopInfo' [-Wunused-function] 61 | static ncclResult_t getLoopInfo(struct ncclInfo* collInfo); | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:794:21: warning: unused function 'getCBDCollnChannel' [-Wunused-function] 794 | static ncclResult_t getCBDCollnChannel(struct ncclKernelPlan* plan, struct ncclInfo* collInfo, int usableChannels) { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:11: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:15: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:209:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 209 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:47:21: warning: unused function 'computeColl' [-Wunused-function] 47 | static ncclResult_t computeColl(struct ncclInfo* info /* input */, int* workFuncIndex, struct ncclWorkElem* work, struct ncclProxyOp* proxyOp /* output */); | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:61:21: warning: unused function 'getLoopInfo' [-Wunused-function] 61 | static ncclResult_t getLoopInfo(struct ncclInfo* collInfo); | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:794:21: warning: unused function 'getCBDCollnChannel' [-Wunused-function] 794 | static ncclResult_t getCBDCollnChannel(struct ncclKernelPlan* plan, struct ncclInfo* collInfo, int usableChannels) { | ^~~~~~~~~~~~~~~~~~ 37 warnings generated when compiling for gfx90a. 37 warnings generated when compiling for gfx1101. 37 warnings generated when compiling for gfx90a. 37 warnings generated when compiling for gfx1102. 37 warnings generated when compiling for gfx1200. 37 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init_nvtx.cc:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx.h:10: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp:1940:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1940 | 0, // payload value (union) | ^ | {} /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp:1942:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1942 | 0 // message value (union) | ^ | {} In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init_nvtx.cc:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init_nvtx.cc:4:42: warning: unused variable 'NvtxEnumRedSchema' [-Wunused-const-variable] 4 | static constexpr const nvtxPayloadEnum_t NvtxEnumRedSchema[] = { | ^~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init_nvtx.cc:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx.h:10: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp:1940:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1940 | 0, // payload value (union) | ^ | {} /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp:1942:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1942 | 0 // message value (union) | ^ | {} In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init_nvtx.cc:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx.h:10: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp:1940:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1940 | 0, // payload value (union) | ^ | {} /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp:1942:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1942 | 0 // message value (union) | ^ | {} In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init_nvtx.cc:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init_nvtx.cc:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init_nvtx.cc:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx.h:10: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp:1940:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1940 | 0, // payload value (union) | ^ | {} /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp:1942:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1942 | 0 // message value (union) | ^ | {} In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init_nvtx.cc:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx.h:10: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp:1940:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1940 | 0, // payload value (union) | ^ | {} /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp:1942:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1942 | 0 // message value (union) | ^ | {} In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init_nvtx.cc:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx.h:10: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp:1940:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1940 | 0, // payload value (union) | ^ | {} /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp:1942:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1942 | 0 // message value (union) | ^ | {} /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init_nvtx.cc:4:42: warning: unused variable 'NvtxEnumRedSchema' [-Wunused-const-variable] 4 | static constexpr const nvtxPayloadEnum_t NvtxEnumRedSchema[] = { | ^~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init_nvtx.cc:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx.h:10: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp:1940:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1940 | 0, // payload value (union) | ^ | {} /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp:1942:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1942 | 0 // message value (union) | ^ | {} In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init_nvtx.cc:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init_nvtx.cc:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init_nvtx.cc:4:42: warning: unused variable 'NvtxEnumRedSchema' [-Wunused-const-variable] 4 | static constexpr const nvtxPayloadEnum_t NvtxEnumRedSchema[] = { | ^~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init_nvtx.cc:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init_nvtx.cc:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 4 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init_nvtx.cc:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx.h:10: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp:1940:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1940 | 0, // payload value (union) | ^ | {} /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp:1942:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1942 | 0 // message value (union) | ^ | {} In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init_nvtx.cc:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init_nvtx.cc:4:42: warning: unused variable 'NvtxEnumRedSchema' [-Wunused-const-variable] 4 | static constexpr const nvtxPayloadEnum_t NvtxEnumRedSchema[] = { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init_nvtx.cc:4:42: warning: unused variable 'NvtxEnumRedSchema' [-Wunused-const-variable] 4 | static constexpr const nvtxPayloadEnum_t NvtxEnumRedSchema[] = { | ^~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/proxy.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init_nvtx.cc:4:42: warning: unused variable 'NvtxEnumRedSchema' [-Wunused-const-variable] 4 | static constexpr const nvtxPayloadEnum_t NvtxEnumRedSchema[] = { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init_nvtx.cc:4:42: warning: unused variable 'NvtxEnumRedSchema' [-Wunused-const-variable] 4 | static constexpr const nvtxPayloadEnum_t NvtxEnumRedSchema[] = { | ^~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 4 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init_nvtx.cc:4:42: warning: unused variable 'NvtxEnumRedSchema' [-Wunused-const-variable] 4 | static constexpr const nvtxPayloadEnum_t NvtxEnumRedSchema[] = { | ^~~~~~~~~~~~~~~~~ 4 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/proxy.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/proxy.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/proxy.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ 4 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/proxy.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 2 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/proxy.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/proxy.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 4 warnings generated when compiling for gfx1200. 4 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/proxy.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 2 warnings generated when compiling for gfx90a. 4 warnings generated when compiling for gfx1102. 2 warnings generated when compiling for gfx90a. 4 warnings generated when compiling for gfx1201. 2 warnings generated when compiling for gfx1201. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:53:38: warning: unused variable 'MscclSchema' [-Wunused-variable] 53 | constexpr nvtxPayloadSchemaEntry_t MscclSchema[] = { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:57:19: warning: unused variable 'payload' [-Wunused-variable] 57 | NvtxParamsMsccl payload{sendCounts[comm->rank] * ncclTypeSize(dataType), recvCounts[comm->rank] * ncclTypeSize(dataType)}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ 2 warnings generated when compiling for gfx1100. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:53:38: warning: unused variable 'MscclSchema' [-Wunused-variable] 53 | constexpr nvtxPayloadSchemaEntry_t MscclSchema[] = { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:57:19: warning: unused variable 'payload' [-Wunused-variable] 57 | NvtxParamsMsccl payload{sendCounts[comm->rank] * ncclTypeSize(dataType), recvCounts[comm->rank] * ncclTypeSize(dataType)}; | ^~~~~~~ [ 45%] Building CXX object CMakeFiles/rccl.dir/hipify/src/register.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/register.cc.o -MF CMakeFiles/rccl.dir/hipify/src/register.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/register.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/register.cc 2 warnings generated when compiling for host. 2 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/proxy.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:53:38: warning: unused variable 'MscclSchema' [-Wunused-variable] 53 | constexpr nvtxPayloadSchemaEntry_t MscclSchema[] = { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:57:19: warning: unused variable 'payload' [-Wunused-variable] 57 | NvtxParamsMsccl payload{sendCounts[comm->rank] * ncclTypeSize(dataType), recvCounts[comm->rank] * ncclTypeSize(dataType)}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:53:38: warning: unused variable 'MscclSchema' [-Wunused-variable] 53 | constexpr nvtxPayloadSchemaEntry_t MscclSchema[] = { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:57:19: warning: unused variable 'payload' [-Wunused-variable] 57 | NvtxParamsMsccl payload{sendCounts[comm->rank] * ncclTypeSize(dataType), recvCounts[comm->rank] * ncclTypeSize(dataType)}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:53:38: warning: unused variable 'MscclSchema' [-Wunused-variable] 53 | constexpr nvtxPayloadSchemaEntry_t MscclSchema[] = { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:57:19: warning: unused variable 'payload' [-Wunused-variable] 57 | NvtxParamsMsccl payload{sendCounts[comm->rank] * ncclTypeSize(dataType), recvCounts[comm->rank] * ncclTypeSize(dataType)}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:7: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ 2 warnings generated when compiling for gfx1101. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:53:38: warning: unused variable 'MscclSchema' [-Wunused-variable] 53 | constexpr nvtxPayloadSchemaEntry_t MscclSchema[] = { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:57:19: warning: unused variable 'payload' [-Wunused-variable] 57 | NvtxParamsMsccl payload{sendCounts[comm->rank] * ncclTypeSize(dataType), recvCounts[comm->rank] * ncclTypeSize(dataType)}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:7: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:53:38: warning: unused variable 'MscclSchema' [-Wunused-variable] 53 | constexpr nvtxPayloadSchemaEntry_t MscclSchema[] = { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:57:19: warning: unused variable 'payload' [-Wunused-variable] 57 | NvtxParamsMsccl payload{sendCounts[comm->rank] * ncclTypeSize(dataType), recvCounts[comm->rank] * ncclTypeSize(dataType)}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/proxy.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ [ 45%] Building CXX object CMakeFiles/rccl.dir/hipify/src/transport.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/transport.cc.o -MF CMakeFiles/rccl.dir/hipify/src/transport.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/transport.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport.cc /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:53:38: warning: unused variable 'MscclSchema' [-Wunused-variable] 53 | constexpr nvtxPayloadSchemaEntry_t MscclSchema[] = { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:57:19: warning: unused variable 'payload' [-Wunused-variable] 57 | NvtxParamsMsccl payload{sendCounts[comm->rank] * ncclTypeSize(dataType), recvCounts[comm->rank] * ncclTypeSize(dataType)}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/proxy.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:1967:11: warning: unused variable 'stackSize' [-Wunused-variable] 1967 | int64_t stackSize; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:1968:19: warning: unused variable 'devProp' [-Wunused-variable] 1968 | hipDeviceProp_t devProp; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/proxy.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:7: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:1967:11: warning: unused variable 'stackSize' [-Wunused-variable] 1967 | int64_t stackSize; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:1968:19: warning: unused variable 'devProp' [-Wunused-variable] 1968 | hipDeviceProp_t devProp; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2357:26: warning: unused variable 'payload' [-Wunused-variable] 2357 | NvtxParamsCommInitRank payload{myrank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2357:26: warning: unused variable 'payload' [-Wunused-variable] /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2371:38: warning: unused variable 'CommInitAllSchema' [-Wunused-variable] 2371 | constexpr nvtxPayloadSchemaEntry_t CommInitAllSchema[] = { | ^~~~~~~~~~~~~~~~~ 2357 | NvtxParamsCommInitRank payload{myrank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2371:38: warning: unused variable 'CommInitAllSchema' [-Wunused-variable] 2371 | constexpr nvtxPayloadSchemaEntry_t CommInitAllSchema[] = { | ^~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:7: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/proxy.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:1967:11: warning: unused variable 'stackSize' [-Wunused-variable] 1967 | int64_t stackSize; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:1968:19: warning: unused variable 'devProp' [-Wunused-variable] 1968 | hipDeviceProp_t devProp; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:7: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:7: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2701:26: warning: unused variable 'payload' [-Wunused-variable] 2701 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2731:26: warning: unused variable 'payload' [-Wunused-variable] 2731 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2357:26: warning: unused variable 'payload' [-Wunused-variable] 2357 | NvtxParamsCommInitRank payload{myrank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2371:38: warning: unused variable 'CommInitAllSchema' [-Wunused-variable] 2371 | constexpr nvtxPayloadSchemaEntry_t CommInitAllSchema[] = { | ^~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/proxy.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2701:26: warning: unused variable 'payload' [-Wunused-variable] 2701 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2731:26: warning: unused variable 'payload' [-Wunused-variable] 2731 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:7: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2701:26: warning: unused variable 'payload' [-Wunused-variable] 2701 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2731:26: warning: unused variable 'payload' [-Wunused-variable] 2731 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:1967:11: warning: unused variable 'stackSize' [-Wunused-variable] 1967 | int64_t stackSize; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:1968:19: warning: unused variable 'devProp' [-Wunused-variable] 1968 | hipDeviceProp_t devProp; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:7: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2357:26: warning: unused variable 'payload' [-Wunused-variable] 2357 | NvtxParamsCommInitRank payload{myrank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:1967:11: warning: unused variable 'stackSize' [-Wunused-variable] 1967 | int64_t stackSize; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:1968:19: warning: unused variable 'devProp' [-Wunused-variable] 1968 | hipDeviceProp_t devProp; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2371:38: warning: unused variable 'CommInitAllSchema' [-Wunused-variable] 2371 | constexpr nvtxPayloadSchemaEntry_t CommInitAllSchema[] = { | ^~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/proxy.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/proxy.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2357:26: warning: unused variable 'payload' [-Wunused-variable] 2357 | NvtxParamsCommInitRank payload{myrank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2371:38: warning: unused variable 'CommInitAllSchema' [-Wunused-variable] 2371 | constexpr nvtxPayloadSchemaEntry_t CommInitAllSchema[] = { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2701:26: warning: unused variable 'payload' [-Wunused-variable] 2701 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2731:26: warning: unused variable 'payload' [-Wunused-variable] 2731 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ 7 warnings generated when compiling for gfx90a. 2 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:17: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:37: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2701:26: warning: unused variable 'payload' [-Wunused-variable] 2701 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ 245 | s/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2731:26: warning: unused variable 'payload' [-Wunused-variable] 2731 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ tatic ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:38: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:110:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 110 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:204:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 204 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNodeIn file included from */builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 255 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:288:21: warning: unused function 'xmlAddNode' [-Wunused-function] 288 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:906:21: warning: unused function 'collNetTrySetup' [-Wunused-function] 906 | static ncclResult_t collNetTrySetup(ncclComm_t comm, ncclComm_t parent, struct ncclTopoGraph* collNetGraph) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2342:36: warning: unused variable 'CommInitRankSchema' [-Wunused-const-variable] 2342 | constexpr nvtxPayloadSchemaEntry_t CommInitRankSchema[] = { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:17: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:37: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:38: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:110:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 110 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:204:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 204 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 255 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:288:21: warning: unused function 'xmlAddNode' [-Wunused-function] 288 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | stat/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:1967:11: warning: unused variable 'stackSize' [-Wunused-variable] 1967 | int64_t stackSize; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:1968:19: warning: unused variable 'devProp' [-Wunused-variable] 1968 | hipDeviceProp_t devProp; | ^~~~~~~ ic ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:906:21: warning: unused function 'collNetTrySetup' [-Wunused-function] 906 | static ncclResult_t collNetTrySetup(ncclComm_t comm, ncclComm_t parent, struct ncclTopoGraph* collNetGraph) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2342:36: warning: unused variable 'CommInitRankSchema' [-Wunused-const-variable] 2342 | constexpr nvtxPayloadSchemaEntry_t CommInitRankSchema[] = { | ^~~~~~~~~~~~~~~~~~ 7 warnings generated when compiling for gfx1101. 2 warnings generated when compiling for gfx90a. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:1967:11: warning: unused variable 'stackSize' [-Wunused-variable] 1967 | int64_t stackSize; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:1968:19: warning: unused variable 'devProp' [-Wunused-variable] 1968 | hipDeviceProp_t devProp; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2357:26: warning: unused variable 'payload' [-Wunused-variable] 2357 | NvtxParamsCommInitRank payload{myrank, nranks, cudaDev}; | ^~~~~~~ 55 warnings generated when compiling for gfx1101. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2371:38: warning: unused variable 'CommInitAllSchema' [-Wunused-variable] 2371 | constexpr nvtxPayloadSchemaEntry_t CommInitAllSchema[] = { | ^~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:17: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:37: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:38: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:110:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 110 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:204:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 204 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 255 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** s/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2357:26: warning: unused variable 'payload' [-Wunused-variable] 2357 | NvtxParamsCommInitRank payload{myrank, nranks, cudaDev}; | ^~~~~~~ ub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:288:21: warning: unused function 'xmlAddNode' [-Wunused-function] 288 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:906:21: warning: unused function 'collNetTrySetup' [-Wunused-function] 906 | static ncclResult_t collNetTrySetup(ncclComm_t comm, ncclComm_t parent, struct ncclTopoGraph* collNetGraph) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2342:36: warning: unused variable 'CommInitRankSchema' [-Wunused-const-variable] 2342 | constexpr nvtxPayloadSchemaEntry_t CommInitRankSchema[] = { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2371:38: warning: unused variable 'CommInitAllSchema' [-Wunused-variable] 2371 | constexpr nvtxPayloadSchemaEntry_t CommInitAllSchema[] = { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:1967:11: warning: unused variable 'stackSize' [-Wunused-variable] 1967 | int64_t stackSize; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:1968:19: warning: unused variable 'devProp' [-Wunused-variable] 1968 | hipDeviceProp_t devProp; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2701:26: warning: unused variable 'payload' [-Wunused-variable] 2701 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2731:26: warning: unused variable 'payload' [-Wunused-variable] 2731 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2701:26: warning: unused variable 'payload' [-Wunused-variable] 2701 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ 2 warnings generated when compiling for gfx90a. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2731:26: warning: unused variable 'payload' [-Wunused-variable] 2731 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2357:26: warning: unused variable 'payload' [-Wunused-variable] 2357 | NvtxParamsCommInitRank payload{myrank, nranks, cudaDev}; | ^~~~~~~ 2 warnings generated when compiling for gfx1201. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2371:38: warning: unused variable 'CommInitAllSchema' [-Wunused-variable] 2371 | constexpr nvtxPayloadSchemaEntry_t CommInitAllSchema[] = { | ^~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:17: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:37: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:38: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:110:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 110 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:204:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 204 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 255 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:288:21: warning: unused function 'xmlAddNode' [-Wunused-function] 288 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:906:21: warning: unused function 'collNetTrySetup' [-Wunused-function] 906 | static ncclResult_t collNetTrySetup(ncclComm_t comm, ncclComm_t parent, struct ncclTopoGraph* collNetGraph) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2342:36: warning: unused variable 'CommInitRankSchema' [-Wunused-const-variable] 2342 | constexpr nvtxPayloadSchemaEntry_t CommInitRankSchema[] = { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:17: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(stru2c warnings generated when compiling for gfx1102. t ncclComm* comm, void* handles[], int nranks, int rank, void* liste7 warnings generated when compiling for gfx1200. nComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void*/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2701:26: warning: unused variable 'payload' [-Wunused-variable] 2701 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ * mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, voiIn file included from d/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:17: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, list/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2731:26: warning: unused variable 'payload' [-Wunused-variable] 2731 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ ** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:37: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank)enComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:37: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:38: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:110:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 110 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:204:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 204 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 255 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:288:21: warning: unused function 'xmlAddNode' [-Wunused-function] 288 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:906:21: warning: unused function 'collNetTrySetup' [-Wunused-function] 906 | static ncclResult_t collNetTrySetup(ncclComm_t comm, ncclComm_t parent, struct ncclTopoGraph* collNetGraph) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2342:36: warning: unused variable 'CommInitRankSchema' [-Wunused-const-variable] 2342 | constexpr nvtxPayloadSchemaEntry_t CommInitRankSchema[] = { | ^~~~~~~~~~~~~~~~~~ { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:38: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:110:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 110 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: 2warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* warning nso generatedd when compiling for e,gfx1200 . const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const 7 warnings generated when compiling for gfx90a. char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:204:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 204 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 255 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:288:21: warning: unused function 'xmlAddNode' [-Wunused-function] 288 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:906:21: warning: unused function 'collNetTrySetup' [-Wunused-function] 906 | static ncclResult_t collNetTrySetup(ncclComm_t comm, ncclComm_t parent, struct ncclTopoGraph* collNetGraph) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2342:36: warning: unused variable 'CommInitRankSchema' [-Wunused-const-variable] 2342 | constexpr nvtxPayloadSchemaEntry_t CommInitRankSchema[] = { | ^~~~~~~~~~~~~~~~~~ 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for host. 55 warnings generated when compiling for gfx90a. 2 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:17: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:37: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:38: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:110:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 110 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:204:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 204 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 255 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:288:21: warning: unused function 'xmlAddNode' [-Wunused-function] 288 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:906:21: warning: unused function 'collNetTrySetup' [-Wunused-function] 906 | static ncclResult_t collNetTrySetup(ncclComm_t comm, ncclComm_t parent, struct ncclTopoGraph* collNetGraph) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2342:36: warning: unused variable 'CommInitRankSchema' [-Wunused-const-variable] 2342 | constexpr nvtxPayloadSchemaEntry_t CommInitRankSchema[] = { | ^~~~~~~~~~~~~~~~~~ In file included from 7 warnings generated when compiling for gfx1201. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:17: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:37: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:38: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:110:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 110 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:204:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 204 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 255 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:288:21: warning: unused function 'xmlAddNode' [-Wunused-function] 288 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:906:21: warning: unused function 'collNetTrySetup' [-Wunused-function] 906 | static ncclResult_t collNetTrySetup(ncclComm_t comm, ncclComm_t parent, struct ncclTopoGraph* collNetGraph) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2342:36: warning: unused variable 'CommInitRankSchema' [-Wunused-const-variable] 2342 | constexpr nvtxPayloadSchemaEntry_t CommInitRankSchema[] = { | ^~~~~~~~~~~~~~~~~~ [ 46%] Building CXX object CMakeFiles/rccl.dir/hipify/src/device/common.cu.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/common.cu.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/common.cu.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/common.cu.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.cu.cpp 55 warnings generated when compiling for gfx1200. 55 warnings generated when compiling for gfx90a. 55 warnings generated when compiling for gfx1102. 55 warnings generated when compiling for gfx1100. 55 warnings generated when compiling for gfx1201. 37 warnings generated when compiling for host. [ 46%] Building CXX object CMakeFiles/rccl.dir/hipify/src/device/onerank.cu.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/onerank.cu.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/onerank.cu.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/onerank.cu.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/onerank.cu.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 2 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ [ 46%] Building CXX object CMakeFiles/rccl.dir/hipify/src/graph/connect.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/graph/connect.cc.o -MF CMakeFiles/rccl.dir/hipify/src/graph/connect.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/graph/connect.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.cu.cpp:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.cu.cpp:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.cu.cpp:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 2 warnings generated when compiling for gfx1102. 2 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.cu.cpp:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 2 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.cu.cpp:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 2 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.cu.cpp:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 2 warnings generated when compiling for gfx90a. 2 warnings generated when compiling for gfx1100. 2 warnings generated when compiling for gfx90a. 2 warnings generated when compiling for gfx1101. 2 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.cu.cpp:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.cu.cpp:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 2 warnings generated when compiling for gfx1200. [ 46%] Building CXX object CMakeFiles/rccl.dir/hipify/src/graph/paths.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/graph/paths.cc.o -MF CMakeFiles/rccl.dir/hipify/src/graph/paths.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/graph/paths.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc 2 warnings generated when compiling for gfx90a. 2 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.cu.cpp:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.cu.cpp:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/onerank.cu.cpp:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common_kernel.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.cu.cpp:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/onerank.cu.cpp:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common_kernel.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.cu.cpp:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.cu.cpp:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.cu.cpp:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/onerank.cu.cpp:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common_kernel.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 2 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.cu.cpp:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/onerank.cu.cpp:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common_kernel.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/onerank.cu.cpp:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common_kernel.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/onerank.cu.cpp:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common_kernel.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.cu.cpp:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ [ 47%] Building CXX object CMakeFiles/rccl.dir/hipify/src/graph/rings.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/graph/rings.cc.o -MF CMakeFiles/rccl.dir/hipify/src/graph/rings.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/graph/rings.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rings.cc In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/onerank.cu.cpp:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common_kernel.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/onerank.cu.cpp:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common_kernel.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 55 warnings generated when compiling for host. [ 47%] Building CXX object CMakeFiles/rccl.dir/hipify/src/graph/rome_models.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/graph/rome_models.cc.o -MF CMakeFiles/rccl.dir/hipify/src/graph/rome_models.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/graph/rome_models.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:120:12: warning: unused variable 'y' [-Wunused-variable] 120 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:127:7: warning: unused variable 'localRanks' [-Wunused-variable] 127 | int localRanks = comm->topo->nodes[GPU].count; | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:120:12: warning: unused variable 'y' [-Wunused-variable] 120 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:127:7: warning: unused variable 'localRanks' [-Wunused-variable] 127 | int localRanks = comm->topo->nodes[GPU].count; | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:261:21: warning: unused function 'getIndexes' [-Wunused-function] 261 | static ncclResult_t getIndexes(int* ranks, int* indexes, int nNodes) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:435:21: warning: unused function 'connectNvls' [-Wunused-function] 435 | static ncclResult_t connectNvls(struct ncclComm* comm, int* nvlsHeads, int nHeads) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:120:12: warning: unused variable 'y' [-Wunused-variable] 120 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:127:7: warning: unused variable 'localRanks' [-Wunused-variable] 127 | int localRanks = comm->topo->nodes[GPU].count; | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:120:12: warning: unused variable 'y' [-Wunused-variable] 120 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:127:7: warning: unused variable 'localRanks' [-Wunused-variable] 127 | int localRanks = comm->topo->nodes[GPU].count; | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:120:12: warning: unused variable 'y' [-Wunused-variable] 120 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:127:7: warning: unused variable 'localRanks' [-Wunused-variable] 127 | int localRanks = comm->topo->nodes[GPU].count; | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:120:12: warning: unused variable 'y' [-Wunused-variable] 120 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:127:7: warning: unused variable 'localRanks' [-Wunused-variable] 127 | int localRanks = comm->topo->nodes[GPU].count; | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/onerank.cu.cpp:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:261:21: warning: unused function 'getIndexes' [-Wunused-function] 261 | static ncclResult_t getIndexes(int* ranks, int* indexes, int nNodes) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:435:21: warning: unused function 'connectNvls' [-Wunused-function] 435 | static ncclResult_t connectNvls(struct ncclComm* comm, int* nvlsHeads, int nHeads) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:120:12: warning: unused variable 'y' [-Wunused-variable] 120 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:127:7: warning: unused variable 'localRanks' [-Wunused-variable] 127 | int localRanks = comm->topo->nodes[GPU].count; | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:261:21: warning: unused function 'getIndexes' [-Wunused-function] 261 | static ncclResult_t getIndexes(int* ranks, int* indexes, int nNodes) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:435:21: warning: unused function 'connectNvls' [-Wunused-function] 435 | static ncclResult_t connectNvls(struct ncclComm* comm, int* nvlsHeads, int nHeads) { | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:261:21: warning: unused function 'getIndexes' [-Wunused-function] 261 | static ncclResult_t getIndexes(int* ranks, int* indexes, int nNodes) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:435:21: warning: unused function 'connectNvls' [-Wunused-function] 435 | static ncclResult_t connectNvls(struct ncclComm* comm, int* nvlsHeads, int nHeads) { | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/onerank.cu.cpp:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:261:21: warning: unused function 'getIndexes' [-Wunused-function] 261 | static ncclResult_t getIndexes(int* ranks, int* indexes, int nNodes) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:435:21: warning: unused function 'connectNvls' [-Wunused-function] 435 | static ncclResult_t connectNvls(struct ncclComm* comm, int* nvlsHeads, int nHeads) { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:120:12: warning: unused variable 'y' [-Wunused-variable] 120 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:127:7: warning: unused variable 'localRanks' [-Wunused-variable] 127 | int localRanks = comm->topo->nodes[GPU].count; | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:261:21: warning: unused function 'getIndexes' [-Wunused-function] 261 | static ncclResult_t getIndexes(int* ranks, int* indexes, int nNodes) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:435:21: warning: unused function 'connectNvls' [-Wunused-function] 435 | static ncclResult_t connectNvls(struct ncclComm* comm, int* nvlsHeads, int nHeads) { | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:261:21: warning: unused function 'getIndexes' [-Wunused-function] 261 | static ncclResult_t getIndexes(int* ranks, int* indexes, int nNodes) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:435:21: warning: unused function 'connectNvls' [-Wunused-function] 435 | static ncclResult_t connectNvls(struct ncclComm* comm, int* nvlsHeads, int nHeads) { | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/onerank.cu.cpp:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:261:21: warning: unused function 'getIndexes' [-Wunused-function] 261 | static ncclResult_t getIndexes(int* ranks, int* indexes, int nNodes) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:435:21: warning: unused function 'connectNvls' [-Wunused-function] 435 | static ncclResult_t connectNvls(struct ncclComm* comm, int* nvlsHeads, int nHeads) { | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/onerank.cu.cpp:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/onerank.cu.cpp:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/onerank.cu.cpp:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 13 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/onerank.cu.cpp:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/onerank.cu.cpp:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:272:7: warning: variable 'intermediateIndex' set but not used [-Wunused-but-set-variable] 272 | int intermediateIndex = -1; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:459:24: warning: unused variable 'gpu' [-Wunused-variable] 459 | struct ncclTopoNode* gpu = system->nodes[GPU].nodes+g; | ^~~ 13 warnings generated when compiling for gfx1101. 13 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 13 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:272:7: warning: variable 'intermediateIndex' set but not used [-Wunused-but-set-variable] 272 | int intermediateIndex = -1; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:459:24: warning: unused variable 'gpu' [-Wunused-variable] 459 | struct ncclTopoNode* gpu = system->nodes[GPU].nodes+g; | ^~~ 13 warnings generated when compiling for gfx1200. 13 warnings generated when compiling for gfx90a. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:272:7: warning: variable 'intermediateIndex' set but not used [-Wunused-but-set-variable] 272 | int intermediateIndex = -1; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:459:24: warning: unused variable 'gpu' [-Wunused-variable] 459 | struct ncclTopoNode* gpu = system->nodes[GPU].nodes+g; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:272:7: warning: variable 'intermediateIndex' set but not used [-Wunused-but-set-variable] 272 | int intermediateIndex = -1; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:459:24: warning: unused variable 'gpu' [-Wunused-variable] 459 | struct ncclTopoNode* gpu = system->nodes[GPU].nodes+g; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:10: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:110:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 110 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:204:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 204 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 255 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:288:21: warning: unused function 'xmlAddNode' [-Wunused-function] 288 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:10: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:110:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 110 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:204:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 204 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 255 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:288:21: warning: unused function 'xmlAddNode' [-Wunused-function] 288 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:272:7: warning: variable 'intermediateIndex' set but not used [-Wunused-but-set-variable] 272 | int intermediateIndex = -1; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:459:24: warning: unused variable 'gpu' [-Wunused-variable] 459 | struct ncclTopoNode* gpu = system->nodes[GPU].nodes+g; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:272:7: warning: variable 'intermediateIndex' set but not used [-Wunused-but-set-variable] 272 | int intermediateIndex = -1; | ^ 13 warnings generated when compiling for gfx1102. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:272:7: warning: variable 'intermediateIndex' set but not used [-Wunused-but-set-variable] 272 | int intermediateIndex = -1; | ^ :459:24: warning: unused variable 'gpu' [-Wunused-variable] 459 | struct ncclTopoNode* gpu = system->nodes[GPU].nodes+g; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:272:7: warning: variable 'intermediateIndex' set but not used [-Wunused-but-set-variable] 272 | int intermediateIndex = -1; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:459:24: warning: unused variable 'gpu' [-Wunused-variable] 459 | struct ncclTopoNode* gpu = system->nodes[GPU].nodes+g; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:459:24: warning: unused variable 'gpu' [-Wunused-variable] 459 | struct ncclTopoNode* gpu = system->nodes[GPU].nodes+g; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:10: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:110:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 110 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:204:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 204 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 255 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:288:21: warning: unused function 'xmlAddNode' [-Wunused-function] 288 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:10: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:110:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 110 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:204:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 204 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 255 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:288:21: warning: unused function 'xmlAddNode' [-Wunused-function] 288 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:10: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:110:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 110 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:204:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 204 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 255 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:288:21: warning: unused function 'xmlAddNode' [-Wunused-function] 288 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:10: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:110:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 110 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:204:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 204 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 255 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:288:21: warning: unused function 'xmlAddNode' [-Wunused-function] 288 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:10: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:110:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 110 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:204:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 204 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 255 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:288:21: warning: unused function 'xmlAddNode' [-Wunused-function] 288 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:10: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:110:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 110 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:204:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 204 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 255 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:288:21: warning: unused function 'xmlAddNode' [-Wunused-function] 288 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 30 warnings generated when compiling for gfx90a. 30 warnings generated when compiling for gfx90a. 30 warnings generated when compiling for gfx1100. 13 warnings generated when compiling for host. 30 warnings generated when compiling for gfx1201. 30 warnings generated when compiling for gfx1102. 30 warnings generated when compiling for gfx1200. [ 47%] Building CXX object CMakeFiles/rccl.dir/hipify/src/graph/search.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/graph/search.cc.o -MF CMakeFiles/rccl.dir/hipify/src/graph/search.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/graph/search.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/search.cc In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rings.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 30 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rings.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rings.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rings.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rings.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rings.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rings.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:23: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ warning generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:23: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:23: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:23: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rings.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:23: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1044:7: warning: unused variable 'nChannels' [-Wunused-variable] 1044 | int nChannels = 0; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1054:12: warning: unused variable 'y' [-Wunused-variable] 1054 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1044:7: warning: unused variable 'nChannels' [-Wunused-variable] 1044 | int nChannels = 0; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1054:12: warning: unused variable 'y' [-Wunused-variable] 1054 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1563:14: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1563 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1563:14: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1538:7: note: declared here 1538 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1563:24: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1563 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1563:24: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1538:7: note: declared here 1538 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1535:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1535 | static char ringRemap[256]; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1554:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1554 | int gcnt = 0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1625:9: warning: unused variable 't' [-Wunused-variable] 1625 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1563:14: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1563 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1563:14: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1538:7: note: declared here 1538 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1563:24: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1563 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1563:24: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1538:7: note: declared here 1538 | int ngpus = system->nodes[GPU].count; | ^ 1 warning generated when compiling for gfx90a. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1535:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1535 | static char ringRemap[256]; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1554:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1554 | int gcnt = 0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1625:9: warning: unused variable 't' [-Wunused-variable] 1625 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1712:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1712 | static char ringRemap[64]; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1716:7: warning: unused variable 'ncpus' [-Wunused-variable] 1716 | int ncpus = system->nodes[CPU].count; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1809:9: warning: unused variable 't' [-Wunused-variable] 1809 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1892:11: warning: 'NUMA_CPUS' macro redefined [-Wmacro-redefined] 1892 | #define NUMA_CPUS 4 | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1530:11: note: previous definition is here 1530 | #define NUMA_CPUS 2 | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1895:11: warning: 'TOTAL_PERMUTE_COUNT' macro redefined [-Wmacro-redefined] 1895 | #define TOTAL_PERMUTE_COUNT (NUMA_PERMUTE_COUNT*NUMA_PERMUTE_COUNT*NUMA_PERMUTE_COUNT*NUMA_PERMUTE_COUNT) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1533:11: note: previous definition is here 1533 | #define TOTAL_PERMUTE_COUNT (NUMA_PERMUTE_COUNT*NUMA_PERMUTE_COUNT) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1927:14: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1927 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1927:14: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1900:7: note: declared here 1900 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1927:24: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1927 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1927:24: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1900:7: note: declared here 1900 | int ngpus = system->nodes[GPU].count; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:23: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1044:7: warning: unused variable 'nChannels' [-Wunused-variable] 1044 | int nChannels = 0; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1054:12: warning: unused variable 'y' [-Wunused-variable] 1054 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1897:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1897 | static char ringRemap[256]; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1918:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1918 | int gcnt = 0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1993:9: warning: unused variable 't' [-Wunused-variable] 1993 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1712:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1712 | static char ringRemap[64]; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1716:7: warning: unused variable 'ncpus' [-Wunused-variable] 1716 | int ncpus = system->nodes[CPU].count; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1809:9: warning: unused variable 't' [-Wunused-variable] 1809 | f/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.ccloa:t1044 :t7 := warning: (tunused variable 'nChannels' [-Wunused-variable]v e.tv_sec - tvs.tv_ s1044e | c ) *i1nEt3 n+C h(atnvnee.ltsv _=us e0c; - | t ^~~~~~~~~v s.tv_/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.ccu:se1054c:)12/:1 Ewarning: 3unused variable 'y' [-Wunused-variable]; | ^ 1054 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2051:15: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 2051 | int g_hives[ngpus], n_hives[nnets]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2051:15: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2034:7: note: declared here 2034 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2051:31: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 2051 | int g_hives[ngpus], n_hives[nnets]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2051:31: note: read of non-const variable 'nnets' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2035:7: note: declared here 2035 | int nnets = system->nodes[NET].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1892:11: warning: 'NUMA_CPUS' macro redefined [-Wmacro-redefined] 1892 | #define NUMA_CPUS 4 | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1530:11: note: previous definition is here 1530 | #define NUMA_CPUS 2 | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1895:11: warning: 'TOTAL_PERMUTE_COUNT' macro redefined [-Wmacro-redefined] 1895 | #define TOTAL_PERMUTE_COUNT (NUMA_PERMUTE_COUNT*NUMA_PERMUTE_COUNT*NUMA_PERMUTE_COUNT*NUMA_PERMUTE_COUNT) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1533:11: note: previous definition is here 1533 | #define TOTAL_PERMUTE_COUNT (NUMA_PERMUTE_COUNT*NUMA_PERMUTE_COUNT) | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:23: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2032:15: warning: unused variable 'ringRemap' [-Wunused-variable] 2032 | static char ringRemap[256]; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1927:14: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1927 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1927:14: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1900:7: note: declared here 1900 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1927:24: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1927 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1927:24: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1900:7: note: declared here 1900 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1897:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1897 | static char ringRemap[256]; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1918:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1918 | int gcnt = 0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1993:9: warning: unused variable 't' [-Wunused-variable] 1993 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2051:15: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 2051 | int g_hives[ngpus], n_hives[nnets]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2051:15: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2034:7: note: declared here 2034 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2051:31: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 2051 | int g_hives[ngpus], n_hives[nnets]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2051:31: note: read of non-const variable 'nnets' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2035:7: note: declared here 2035 | int nnets = system->nodes[NET].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2032:15: warning: unused variable 'ringRemap' [-Wunused-variable] 2032 | static char ringRemap[256]; | ^~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:23: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1563:14: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1563 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1563:14: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1538:7: note: declared here 1538 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1563:24: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1563 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1563:24: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1538:7: note: declared here 1538 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1535:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1535 | static char ringRemap[256]; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1554:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1554 | int gcnt = 0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1625:9: warning: unused variable 't' [-Wunused-variable] 1625 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ 1 warning generated when compiling for gfx1101. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1563:14: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1563 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1563:14: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1538:7: note: declared here 1538 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1563:24: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1563 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1563:24: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1538:7: note: declared here 1538 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1535:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1535 | static char ringRemap[256]; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1554:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1554 | int gcnt = 0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1625:9: warning: unused variable 't' [-Wunused-variable] 1625 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1712:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1712 | static char ringRemap[64]; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1716:7: warning: unused variable 'ncpus' [-Wunused-variable] 1716 | int ncpus = system->nodes[CPU].count; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1809:9: warning: unused variable 't' [-Wunused-variable] 1809 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1044:7: warning: unused variable 'nChannels' [-Wunused-variable] 1044 | int nChannels = 0; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1054:12: warning: unused variable 'y' [-Wunused-variable] 1054 | int x=0, y=0; | ^ 1 warning generated when compiling for gfx90a. tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1892:11: warning: 'NUMA_CPUS' macro redefined [-Wmacro-redefined] 1892 | #define NUMA_CPUS 4 | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1530:11: note: previous definition is here 1530 | #define NUMA_CPUS 2 | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1895:11: warning: 'TOTAL_PERMUTE_COUNT' macro redefined [-Wmacro-redefined] 1895 | #define TOTAL_PERMUTE_COUNT (NUMA_PERMUTE_COUNT*NUMA_PERMUTE_COUNT*NUMA_PERMUTE_COUNT*NUMA_PERMUTE_COUNT) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1533:11: note: previous definition is here 1533 | #define TOTAL_PERMUTE_COUNT (NUMA_PERMUTE_COUNT*NUMA_PERMUTE_COUNT) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1927:14: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1927 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1927:14: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1900:7: note: declared here 1900 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1927:24: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1927 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1927:24: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1900:7: note: declared here 1900 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1897:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1897 | static char ringRemap[256]; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1918:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1918 | int gcnt = 0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1993:9: warning: unused variable 't' [-Wunused-variable] 1993 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2051:15: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 2051 | int g_hives[ngpus], n_hives[nnets]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2051:15: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2034:7: note: declared here 2034 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2051:31: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 2051 | int g_hives[ngpus], n_hives[nnets]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2051:31: note: read of non-const variable 'nnets' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2035:7: note: declared here 2035 | int nnets = system->nodes[NET].count; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:22: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:24: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:25: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:110:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 110 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:204:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 204 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 255 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:288:21: warning: unused function 'xmlAddNode' [-Wunused-function] 288 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2032:15: warning: unused variable 'ringRemap' [-Wunused-variable] 2032 | static char ringRemap[256]; | ^~~~~~~~~ 1 warning generated when compiling for gfx1102. 1 warning generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:22: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:24: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc | st:a1712ti:c15 :b owarning: olunused variable 'ringRemap' [-Wunused-variable] isPow2(int val) {1712 | | ^~~~~~ stati/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.hc: 282c:h12a:r warning: runused function 'mirrorBits' [-Wunused-function]i ngRemap[ 62824 | ]s;t a t| i ^~~~~~~~~c int /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.ccm:ir1716r:o7r:B iwarning: tunused variable 'ncpus' [-Wunused-variable]s (int val ,1716 | i n ti npto wn2c)p u{s =| ^~~~~~~~~~s ystem->nodes[CPUIn file included from ]/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc.:coun25t: ; /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h :| 75 ^~~~~: 21: warning: unused function 'xmlAlloc' [-Wunused-function]/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc :1809:9: warning: unused variable 't' [-Wunused-variable] 75 | static ncclResult_t xm l1809A | l l ofcl(osattr utc t= n(ctcvleX.mtlv*_*s excm l-, tivnst. tmva_xsNeocd)e*s1)E 3{ + | ( ^~~~~~~~t ve.tv_u/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.hse:c110 :-21 :t vwarning: sunused function 'xmlGetAttrInt' [-Wunused-function]. tv_usec)/1E3; | ^110 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:204:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 204 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 255 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:288:21: warning: unused function 'xmlAddNode' [-Wunused-function] 288 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1563:14: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1563 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1563:14: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1538:7: note: declared here 1538 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1563:24: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1563 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1563:24: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1538:7: note: declared here 1538 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1892:11: warning: 'NUMA_CPUS' macro redefined [-Wmacro-redefined] 1892 | #define NUMA_CPUS 4 | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1530:11: note: previous definition is here 1530 | #define NUMA_CPUS 2 | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1895:11: warning: 'TOTAL_PERMUTE_COUNT' macro redefined [-Wmacro-redefined] 1895 | #define TOTAL_PERMUTE_COUNT (NUMA_PERMUTE_COUNT*NUMA_PERMUTE_COUNT*NUMA_PERMUTE_COUNT*NUMA_PERMUTE_COUNT) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1533:11: note: previous definition is here 1533 | #define TOTAL_PERMUTE_COUNT (NUMA_PERMUTE_COUNT*NUMA_PERMUTE_COUNT) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1927:14: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1927 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1927:14: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1900:7: note: declared here 1900 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1927:24: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1927 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1927:24: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1900:7: note: declared here 1900 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1535:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1535 | static char ringRemap[256]; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1554:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1554 | int gcnt = 0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1625:9: warning: unused variable 't' [-Wunused-variable] 1625 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1897:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1897 | static char ringRemap[256]; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1918:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1918 | int gcnt = 0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1993:9: warning: unused variable 't' [-Wunused-variable] 1993 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1712:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1712 | static char ringRemap[64]; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1716:7: warning: unused variable 'ncpus' [-Wunused-variable] 1716 | int ncpus = system->nodes[CPU].count; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1809:9: warning: unused variable 't' [-Wunused-variable] 1809 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2051:15: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1892:11: warning: 'NUMA_CPUS' macro redefined [-Wmacro-redefined] 1892 | #define NUMA_CPUS 4 | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1530:11: note: previous definition is here 1530 | #define NUMA_CPUS 2 | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1895:11: warning: 'TOTAL_PERMUTE_COUNT' macro redefined [-Wmacro-redefined] 1895 | #define TOTAL_PERMUTE_COUNT (NUMA_PERMUTE_COUNT*NUMA_PERMUTE_COUNT*NUMA_PERMUTE_COUNT*NUMA_PERMUTE_COUNT) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1533:11: note: previous definition is here 1533 | #define TOTAL_PERMUTE_COUNT (NUMA_PERMUTE_COUNT*NUMA_PERMUTE_COUNT) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1927:14: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1927 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1927:14: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1900:7: note: declared here 1900 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1927:24: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1927 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1927:24: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1900:7: note: declared here 1900 | int ngpus = system->nodes[GPU].count; | ^ 2051 | int g_hives[ngpus], n_hives[nnets]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2051:15: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2034:7: note: declared here 2034 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2051:31: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 2051 | int g_hives[ngpus], n_hives[nnets]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2051:31: note: read of non-const variable 'nnets' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2035:7: note: declared here 2035 | int nnets = system->nodes[NET].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2032:15: warning: unused variable 'ringRemap' [-Wunused-variable] 2032 | static char ringRemap[256]; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1897:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1897 | static char ringRemap[256]; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1918:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1918 | int gcnt = 0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1993:9: warning: unused variable 't' [-Wunused-variable] 1993 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2051:15: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 2051 | int g_hives[ngpus], n_hives[nnets]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2051:15: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2034:7: note: declared here 2034 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2051:31: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 2051 | int g_hives[ngpus], n_hives[nnets]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2051:31: note: read of non-const variable 'nnets' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2035:7: note: declared here 2035 | int nnets = system->nodes[NET].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2032:15: warning: unused variable 'ringRemap' [-Wunused-variable] 2032 | static char ringRemap[256]; | ^~~~~~~~~ 1 warning generated when compiling for gfx1201. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1044:7: warning: unused variable 'nChannels' [-Wunused-variable] 1044 | int nChannels = 0; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1054:12: warning: unused variable 'y' [-Wunused-variable] 1054 | int x=0, y=0; | ^ 1 warning generated when compiling for gfx1200. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1044:7: warning: unused variable 'nChannels' [-Wunused-variable] 1044 | int nChannels = 0; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1054:12: warning: unused variable 'y' [-Wunused-variable] 1054 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1044:7: warning: unused variable 'nChannels' [-Wunused-variable] 1044 | int nChannels = 0; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1054:12: warning: unused variable 'y' [-Wunused-variable] 1054 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1563:14: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1563 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1563:14: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1538:7: note: declared here 1538 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1563:24: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1563 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1563:24: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1538:7: note: declared here 1538 | int ngpus = system->nodes[GPU].count; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:22: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:24: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:25: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:110:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 110 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:204:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 204 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 255 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:288:21: warning: unused function 'xmlAddNode' [-Wunused-function] 288 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1535:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1535 | static char ringRemap[256]; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1554:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1554 | int gcnt = 0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1625:9: warning: unused variable 't' [-Wunused-variable] 1625 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1563:14: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1563 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1563:14: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1538:7: note: declared here 1538 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1563:24: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1563 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1563:24: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1538:7: note: declared here 1538 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1712:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1712 | static char ringRemap[64]; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1716:7: warning: unused variable 'ncpus' [-Wunused-variable] 1716 | int ncpus = system->nodes[CPU].count; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1809:9: warning: unused variable 't' [-Wunused-variable] 1809 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1892:11: warning: 'NUMA_CPUS' macro redefined [-Wmacro-redefined] 1892 | #define NUMA_CPUS 4 | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1530:11: note: previous definition is here 1530 | #define NUMA_CPUS 2 | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1895:11: warning: 'TOTAL_PERMUTE_COUNT' macro redefined [-Wmacro-redefined] 1895 | #define TOTAL_PERMUTE_COUNT (NUMA_PERMUTE_COUNT*NUMA_PERMUTE_COUNT*NUMA_PERMUTE_COUNT*NUMA_PERMUTE_COUNT) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1533:11: note: previous definition is here 1533 | #define TOTAL_PERMUTE_COUNT (NUMA_PERMUTE_COUNT*NUMA_PERMUTE_COUNT) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1563:14: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1563 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1563:14: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1538:7: note: declared here 1538 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1563:24: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1563 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1563:24: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1538:7: note: declared here 1538 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1927:14: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1927 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1927:14: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1900:7: note: declared here 1900 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1927:24: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1927 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1927:24: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1900:7: note: declared here 1900 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1897:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1897 | static char ringRemap[256]; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1918:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1918 | int gcnt = 0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1993:9: warning: unused variable 't' [-Wunused-variable] 1993 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1535:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1535 | static char ringRemap[256]; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1554:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1554 | int gcnt = 0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1625:9: warning: unused variable 't' [-Wunused-variable] 1625 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2051:15: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 2051 | int g_hives[ngpus], n_hives[nnets]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2051:15: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2034:7: note: declared here 2034 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2051:31: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 2051 | int g_hives[ngpus], n_hives[nnets]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2051:31: note: read of non-const variable 'nnets' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2035:7: note: declared here 2035 | int nnets = system->nodes[NET].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1535:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1535 | static char ringRemap[256]; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1554:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1554 | int gcnt = 0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1625:9: warning: unused variable 't' [-Wunused-variable] 1625 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2032:15: warning: unused variable 'ringRemap' [-Wunused-variable] 2032 | static char ringRemap[256]; | ^~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:22: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:24: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:25: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:110:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 110 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:204:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 204 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 255 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:288:21: warning: unused function 'xmlAddNode' [-Wunused-function] 288 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncc/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1712:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1712 | static char ringRemap[64]; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1716:7: warning: unused variable 'ncpus' [-Wunused-variable] 1716 | int ncpus = system->nodes[CPU].count; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1809:9: warning: unused variable 't' [-Wunused-variable] 1809 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ lResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:22: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:24: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:25: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:110:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 110 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:204:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 204 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 255 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:288:21: warning: unused function 'xmlAddNode' [-Wunused-function] 288 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclRe/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1712:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1712 | static char ringRemap[64]; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1716:7: warning: unused variable 'ncpus' [-Wunused-variable] 1716 | int ncpus = system->nodes[CPU].count; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1809:9: warning: unused variable 't' [-Wunused-variable] 1809 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1892:11: warning: 'NUMA_CPUS' macro redefined [-Wmacro-redefined] 1892 | #define NUMA_CPUS 4 | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1530:11: note: previous definition is here 1530 | #define NUMA_CPUS 2 | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1895:11: warning: 'TOTAL_PERMUTE_COUNT' macro redefined [-Wmacro-redefined] 1895 | #define TOTAL_PERMUTE_COUNT (NUMA_PERMUTE_COUNT*NUMA_PERMUTE_COUNT*NUMA_PERMUTE_COUNT*NUMA_PERMUTE_COUNT) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1533:11: note: previous definition is here 1533 | #define TOTAL_PERMUTE_COUNT (NUMA_PERMUTE_COUNT*NUMA_PERMUTE_COUNT) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1892:11: warning: 'NUMA_CPUS' macro redefined [-Wmacro-redefined] 1892 | #define NUMA_CPUS 4 | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1530:11: note: previous definition is here 1530 | #define NUMA_CPUS 2 | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1895:11: warning: 'TOTAL_PERMUTE_COUNT' macro redefined [-Wmacro-redefined] 1895 | #define TOTAL_PERMUTE_COUNT (NUMA_PERMUTE_COUNT*NUMA_PERMUTE_COUNT*NUMA_PERMUTE_COUNT*NUMA_PERMUTE_COUNT) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1533:11: note: previous definition is here 1533 | #define TOTAL_PERMUTE_COUNT (NUMA_PERMUTE_COUNT*NUMA_PERMUTE_COUNT) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1927:14: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1927 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1927:14: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1900:7: note: declared here 1900 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1927:24: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1927 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1927:24: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1900:7: note: declared here 1900 | int ngpus = system->nodes[GPU].count; | ^ sult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1927:14: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1927 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1927:14: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1900:7: note: declared here 1900 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1927:24: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1927 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1927:24: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1900:7: note: declared here 1900 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1897:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1897 | static char ringRemap[256]; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1918:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1918 | int gcnt = 0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1993:9: warning: unused variable 't' [-Wunused-variable] 1993 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1897:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1897 | static char ringRemap[256]; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1918:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1918 | int gcnt = 0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1993:9: warning: unused variable 't' [-Wunused-variable] 1993 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2051:15: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 2051 | int g_hives[ngpus], n_hives[nnets]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2051:15: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2034:7: note: declared here 2034 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2051:31: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 2051 | int g_hives[ngpus], n_hives[nnets]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2051:31: note: read of non-const variable 'nnets' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2035:7: note: declared here 2035 | int nnets = system->nodes[NET].count; | ^ 49 warnings generated when compiling for gfx1102. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2051:15: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 2051 | int g_hives[ngpus], n_hives[nnets]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2051:15: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2034:7: note: declared here 2034 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2051:31: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 2051 | int g_hives[ngpus], n_hives[nnets]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2051:31: note: read of non-const variable 'nnets' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2035:7: note: declared here 2035 | int nnets = system->nodes[NET].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2032:15: warning: unused variable 'ringRemap' [-Wunused-variable] 2032 | static char ringRemap[256]; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2032:15: warning: unused variable 'ringRemap' [-Wunused-variable] 2032 | static char ringRemap[256]; | ^~~~~~~~~ [ 47%] Building CXX object CMakeFiles/rccl.dir/hipify/src/graph/topo.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/graph/topo.cc.o -MF CMakeFiles/rccl.dir/hipify/src/graph/topo.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/graph/topo.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:22: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:24: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:25: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:110:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 110 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:204:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 204 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 255 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:288:21: warning: unused function 'xmlAddNode' [-Wunused-function] 288 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:22: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:24: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:25: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:110:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 110 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:204:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 204 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 255 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:288:21: warning: unused function 'xmlAddNode' [-Wunused-function] 288 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:22: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:24: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:25: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:110:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 110 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:204:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 204 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 255 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:288:21: warning: unused function 'xmlAddNode' [-Wunused-function] 288 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 49 warnings generated when compiling for gfx90a. 30 warnings generated when compiling for host. 49 warnings generated when compiling for gfx1201. 49 warnings generated when compiling for gfx1101. [ 48%] Building CXX object CMakeFiles/rccl.dir/hipify/src/graph/trees.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/graph/trees.cc.o -MF CMakeFiles/rccl.dir/hipify/src/graph/trees.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/graph/trees.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/trees.cc 49 warnings generated when compiling for gfx1100. 49 warnings generated when compiling for gfx90a. 49 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/search.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/search.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/search.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/search.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/search.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/search.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/search.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/search.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/search.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/search.cc:11: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/search.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 255 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/search.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/search.cc:11: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/search.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/search.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from 163/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h | :s126t: aIn file included from t/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.hi:c14 : nIn file included from c/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.hc:l37R: eIn file included from s/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.hu:l14t: _t/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h :x46m:l13F:i nwarning: dTunused function 'log2i' [-Wunused-function]a gKv(struct ncclXml* xml, c46o | nsstta tcihca rl*o ntga glNoagm2ei,( lsotnrgu cnt) n{c c l| X ^~~~~m lNode** node, const char*In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/search.cca:t11t: r/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.hN:a258m:e14,: cwarning: ounused function 'ncclTopoXGMISpeed' [-Wunused-function]n st char* attrV a258l | uset)a t{i c | f ^~~~~~~~~~~~l oat nc/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.hc:l192T:o21p:o Xwarning: Gunused function 'xmlSetAttrIfUnset' [-Wunused-function]M ISpeed(const char* 192g | csnt)a t{i c | n ^~~~~~~~~~~~~~~~~c clRes/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.hu:l268t:_14t: xwarning: munused function 'ncclTopoNVLinkBw' [-Wunused-function]l SetAttrIf U268n | ssetta(tsitcr ufclto antc cnlcXcmllTNoopdoeN*V LniondkeB,w (cionnts tc ucdhaaCro*m paCtatpr)N a{m e ,| ^~~~~~~~~~~~~~~~c onst/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h :c279h:a13r:* warning: vunused function 'isPow2' [-Wunused-function]a lue) { 279| | ^~~~~~~~~~~~~~~~~s tatic/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h :b243o:o21l: iwarning: sunused function 'xmlUnsetAttr' [-Wunused-function]P ow2(int 243 | svtaalt)i {c | ^~~~~~nc clR/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.he:282s:12:u lwarning: tunused function 'mirrorBits' [-Wunused-function]_ t xml U282n | ssettaAtitctr (sitrnuctt minrcrcolrXBmiltNso(dien*t novdael, ,c oinsntt cphoawr2)* at{t r| ^~~~~~~~~~N ame) { In file included from | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/search.cc ^~~~~~~~~~~~: 12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h::255:21117::21 warning: unused function 'xmlGetSub' [-Wunused-function]: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 255 | static nc c117l | Rsetsautlitc_ tn cxcmllRGeestuSlutb_(ts txrmulcGte tnActctlrXImnltNDoedfea*u lnto(dset,r uccotn sntc cclhXamrl*N osdueb*N anmoed,e ,s tcrouncstt ncchcalrX*m laNtotdreN*a*m es,u bi)n t{* v| a ^~~~~~~~~l ue, i/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.hn:t281 :d21e:f awarning: uunused function 'xmlGetSubKvInt' [-Wunused-function]l tValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124 :28121 | :s twarning: aunused function 'xmlGetAttrLong' [-Wunused-function]t ic ncclResult_t xm l124G | esttSautbiKcv Innctc(lsRtersuucltt _ntc cxlmXlmGleNtoAdtet*r Lnoondge(,s tcrouncstt ncchcalrX*m lsNuobdNea*m en,o dset,r uccotn sntc cclhXamrl*N oadtet*r*N asmueb,, icnotn6s4t_ tc*h avra*l uaet)t r{N a m| e ^~~~~~~~~~~~~~, con/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.hs:t139 :i21n:t warning: aunused function 'xmlFindTag' [-Wunused-function]t trValue) { | ^~~~~~~~~~~~~~ 139 | s/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.ht:a310t:i21c: nwarning: cunused function 'xmlRemoveNode' [-Wunused-function]c lResult_t xm 310l | FsitnadtTiagc( sntcrculcRte snuclctl_Xtm lx*m lxRmelm,o vceoNnosdte (cshtarru*c tt angcNcalmXem,l Nsotdreu*c tn ondcec)l X{m l N| o ^~~~~~~~~~~~~d e** node) /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h{: 323 :| 21 ^~~~~~~~~~: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 323 | static nccl R151e | ssutlatt_itc xnmclcAldRdeTsruelet(_stt rxumcltF inncdcNleXxmtlT*a gd(sstt,r usctt rnuccctl Xnmclc*l XxmmllN,o dceo*n spta rcehnatr,* sttarguNcatm en,c csltXrmulcNto dnec*c lsXrmclNNooddee)* {p r e| v ^~~~~~~~~~, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 255 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/search.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/search.cc:11: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/search.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 255 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/search.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/search.cc:11: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/search.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 255 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/search.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/search.cc:11: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/search.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 255 | static ncclResult_t xmlGetSub(struIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/search.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/search.cc:11: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/search.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 255 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ mlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/search.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/search.cc:11: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/search.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 255 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNodIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ e* srcNode) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 17 warnings generated when compiling for gfx1100. 49 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 17 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:10: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:17: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ [ 48%] Building CXX object CMakeFiles/rccl.dir/hipify/src/graph/tuning.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/graph/tuning.cc.o -MF CMakeFiles/rccl.dir/hipify/src/graph/tuning.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/graph/tuning.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc 17 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:10: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:17: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 17 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:10: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:17: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 17 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:10: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int*In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:10: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:17: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclCo warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, mcmo*n scto mcmh,a rvo*i*d *s tcro,l lsCtormumc)t {k vNDCiCcLtC*H ECdKi(ccto)m m{- > n| c ^~~~~~~~~~~~~~c lCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:17: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 29 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:10: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:17: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 2 warnings generated when compiling for gfx1200. 29 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:10: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:17: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:10: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:17: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 29 warnings generated when compiling for gfx1200. 29 warnings generated when compiling for gfx90a. 29 warnings generated when compiling for gfx90a. 29 warnings generated when compiling for gfx1101. 29 warnings generated when compiling for gfx1102. [ 48%] Building CXX object CMakeFiles/rccl.dir/hipify/src/graph/xml.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/graph/xml.cc.o -MF CMakeFiles/rccl.dir/hipify/src/graph/xml.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/graph/xml.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.cc 2 warnings generated when compiling for gfx1101. 2 warnings generated when compiling for gfx1102. 2 warnings generated when compiling for gfx1100. 2 warnings generated when compiling for gfx90a. 2 warnings generated when compiling for gfx90a. 2 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for host. [ 48%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/alt_rsmi.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/alt_rsmi.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/alt_rsmi.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/alt_rsmi.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc [ 49%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/archinfo.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/archinfo.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/archinfo.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/archinfo.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/archinfo.cc In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:338:10: warning: unused variable 'llMaxBw' [-Wunused-variable] 338 | double llMaxBw = llMaxBws[index1][index2]; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:339:10: warning: unused variable 'perChMaxTreeBw' [-Wunused-variable] 339 | double perChMaxTreeBw = perChMaxTreeBws[compCapIndex][index2]; | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:340:10: warning: unused variable 'perChMaxRingLL128Bw' [-Wunused-variable] 340 | double perChMaxRingLL128Bw = perChMaxRingLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:341:10: warning: unused variable 'perChMaxTreeLL128Bw' [-Wunused-variable] 341 | double perChMaxTreeLL128Bw = perChMaxTreeLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:344:9: warning: unused variable 'ppn' [-Wunused-variable] 344 | float ppn = (float)nRanks / nNodes; // if ppn < 2, then we are sending/receiving at the same GPU through the NIC, apply some bw discount | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:11: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:626:14: warning: unused variable 'treeCorrectionFactor' [-Wunused-variable] 626 | static float treeCorrectionFactor[NCCL_NUM_PROTOCOLS][23] = { | ^~~~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:338:10: warning: unused variable 'llMaxBw' [-Wunused-variable] 338 | double llMaxBw = llMaxBws[index1][index2]; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:339:10: warning: unused variable 'perChMaxTreeBw' [-Wunused-variable] 339 | double perChMaxTreeBw = perChMaxTreeBws[compCapIndex][index2]; | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:340:10: warning: unused variable 'perChMaxRingLL128Bw' [-Wunused-variable] 340 | double perChMaxRingLL128Bw = perChMaxRingLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:341:10: warning: unused variable 'perChMaxTreeLL128Bw' [-Wunused-variable] 341 | double perChMaxTreeLL128Bw = perChMaxTreeLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:344:9: warning: unused variable 'ppn' [-Wunused-variable] 344 | float ppn = (float)nRanks / nNodes; // if ppn < 2, then we are sending/receiving at the same GPU through the NIC, apply some bw discount | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:338:10: warning: unused variable 'llMaxBw' [-Wunused-variable] 338 | double llMaxBw = llMaxBws[index1][index2]; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:339:10: warning: unused variable 'perChMaxTreeBw' [-Wunused-variable] 339 | double perChMaxTreeBw = perChMaxTreeBws[compCapIndex][index2]; | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:340:10: warning: unused variable 'perChMaxRingLL128Bw' [-Wunused-variable] 340 | double perChMaxRingLL128Bw = perChMaxRingLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:341:10: warning: unused variable 'perChMaxTreeLL128Bw' [-Wunused-variable] 341 | double perChMaxTreeLL128Bw = perChMaxTreeLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:344:9: warning: unused variable 'ppn' [-Wunused-variable] 344 | float ppn = (float)nRanks / nNodes; // if ppn < 2, then we are sending/receiving at the same GPU through the NIC, apply some bw discount | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:338:10: warning: unused variable 'llMaxBw' [-Wunused-variable] 338 | double llMaxBw = llMaxBws[index1][index2]; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:339:10: warning: unused variable 'perChMaxTreeBw' [-Wunused-variable] 339 | double perChMaxTreeBw = perChMaxTreeBws[compCapIndex][index2]; | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:340:10: warning: unused variable 'perChMaxRingLL128Bw' [-Wunused-variable] 340 | double perChMaxRingLL128Bw = perChMaxRingLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:341:10: warning: unused variable 'perChMaxTreeLL128Bw' [-Wunused-variable] 341 | double perChMaxTreeLL128Bw = perChMaxTreeLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:344:9: warning: unused variable 'ppn' [-Wunused-variable] 344 | float ppn = (float)nRanks / nNodes; // if ppn < 2, then we are sending/receiving at the same GPU through the NIC, apply some bw discount | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:338:10: warning: unused variable 'llMaxBw' [-Wunused-variable] 338 | double llMaxBw = llMaxBws[index1][index2]; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:339:10: warning: unused variable 'perChMaxTreeBw' [-Wunused-variable] 339 | double /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:338:10: warning: unused variable 'llMaxBw' [-Wunused-variable] 338 | double llMaxBw = llMaxBws[index1][index2]; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:339:10: warning: unused variable 'perChMaxTreeBw' [-Wunused-variable] 339 | double perChMaxTreeBw = perChMaxTreeBws[compCapIndex][index2]; | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:340:10: warning: unused variable 'perChMaxRingLL128Bw' [-Wunused-variable] 340perChMaxTreeBw = perChMaxTreeBws[compCapIndex][index2]; | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:340:10: warning: unused variable 'perChMaxRingLL128Bw' [-Wunused-variable] 340 | double perChMaxRingLL128Bw = perChMaxRingLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:341:10: warning: unused variable 'perChMaxTreeLL128Bw' [-Wunused-variable] 341 | double perChMaxTreeLL128Bw = perChMaxTreeLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:344:9: warning: unused variable 'ppn' [-Wunused-variable] 344 | float ppn = (float)nRanks / nNodes; // if ppn < 2, then we are sending/receiving at the same GPU through the NIC, apply some bw discount | ^~~ | double perChMaxRingLL128Bw = perChMaxRingLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:341:10: warning: unused variable 'perChMaxTreeLL128Bw' [-Wunused-variable] 341 | double perChMaxTreeLL128Bw = perChMaxTreeLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:344:9: warning: unused variable 'ppn' [-Wunused-variable] 344 | float ppn = (float)nRanks / nNodes; // if ppn < 2, then we are sending/receiving at the same GPU through the NIC, apply some bw discount | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:11: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:626:14: warning: unused variable 'treeCorrectionFactor' [-Wunused-variable] 626 | static float treeCorrectionFactor[NCCL_NUM_PROTOCOLS][23] = { | ^~~~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:11: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:626:14: warning: unused variable 'treeCorrectionFactor' [-Wunused-variable] 626 | static float treeCorrectionFactor[NCCL_NUM_PROTOCOLS][23] = { | ^~~~~~~~~~~~~~~~~~~~ 2 warnings generated when compiling for gfx1100. 2 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:11: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:626:14: warning: unused variable 'treeCorrectionFactor' [-Wunused-variable] 626 | static float treeCorrectionFactor[NCCL_NUM_PROTOCOLS][23] = { | ^~~~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:11: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:626:14: warning: unused variable 'treeCorrectionFactor' [-Wunused-variable] 626 | static float treeCorrectionFactor[NCCL_NUM_PROTOCOLS][23] = { | ^~~~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:11: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:626:14: warning: unused variable 'treeCorrectionFactor' [-Wunused-variable] 626 | static float treeCorrectionFactor[NCCL_NUM_PROTOCOLS][23] = { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:338:10: warning: unused variable 'llMaxBw' [-Wunused-variable] 338 | double llMaxBw = llMaxBws[index1][index2]; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:339:10: warning: unused variable 'perChMaxTreeBw' [-Wunused-variable] 339 | double perChMaxTreeBw = perChMaxTreeBws[compCapIndex][index2]; | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:340:10: warning: unused variable 'perChMaxRingLL128Bw' [-Wunused-variable] 340 | double perChMaxRingLL128Bw = perChMaxRingLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:341:10: warning: unused variable 'perChMaxTreeLL128Bw' [-Wunused-variable] 341 | double perChMaxTreeLL128Bw = perChMaxTreeLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:344:9: warning: unused variable 'ppn' [-Wunused-variable] 344 | float ppn = (float)nRanks / nNodes; // if ppn < 2, then we are sending/receiving at the same GPU through the NIC, apply some bw discount | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:338:10: warning: unused variable 'llMaxBw' [-Wunused-variable] 338 | double llMaxBw = llMaxBws[index1][index2]; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:339:10: warning: unused variable 'perChMaxTreeBw' [-Wunused-variable] 339 | double perChMaxTreeBw = perChMaxTreeBws[compCapIndex][index2]; | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:340:10: warning: unused variable 'perChMaxRingLL128Bw' [-Wunused-variable] 340 | double perChMaxRingLL128Bw = perChMaxRingLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:341:10: warning: unused variable 'perChMaxTreeLL128Bw' [-Wunused-variable] 341 | double perChMaxTreeLL128Bw = perChMaxTreeLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:344:9: warning: unused variable 'ppn' [-Wunused-variable] 344 | float ppn = (float)nRanks / nNodes; // if ppn < 2, then we are sending/receiving at the same GPU through the NIC, apply some bw discount | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:11: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:626:14: warning: unused variable 'treeCorrectionFactor' [-Wunused-variable] 626 | static float treeCorrectionFactor[NCCL_NUM_PROTOCOLS][23] = { | ^~~~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:11: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:626:14: warning: unused variable 'treeCorrectionFactor' [-Wunused-variable] 626 | static float treeCorrectionFactor[NCCL_NUM_PROTOCOLS][23] = { | ^~~~~~~~~~~~~~~~~~~~ 15 warnings generated when compiling for gfx1101. 29 warnings generated when compiling for host. 15 warnings generated when compiling for gfx1102. 15 warnings generated when compiling for gfx90a. [ 49%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/argcheck.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/argcheck.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/argcheck.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/argcheck.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/argcheck.cc 2 warnings generated when compiling for gfx1101. 15 warnings generated when compiling for gfx1100. 15 warnings generated when compiling for gfx1201. 15 warnings generated when compiling for gfx90a. 15 warnings generated when compiling for gfx1200. 2 warnings generated when compiling for gfx90a. 2 warnings generated when compiling for gfx1102. 15 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.cc:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.cc:16: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.cc:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.cc:16: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.cc:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.cc:16: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.cc:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.cc:16: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ [ 49%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/api_trace.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/api_trace.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/api_trace.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/api_trace.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/api_trace.cc In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.cc:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.cc:16: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.cc:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.cc:16: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 2 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.cc:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.cc:16: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.cc:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.cc:16: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 2 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1200. [ 50%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/ibvsymbols.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/ibvsymbols.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/ibvsymbols.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/ibvsymbols.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ibvsymbols.cc 9 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1201. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:104:33: warning: bitwise negation of a boolean expression always evaluates to 'true'; did you mean logical negation? [-Wbool-operation] 104 | if (ret_gpu_id == 0 && ~(ret_unique_id != 0 || ret_loc_id != 0 || ret_unique_id != 0 || ret_vendor != 0) && | ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | ! /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:102:13: warning: unused variable 'ret_domain' [-Wunused-variable] 102 | int ret_domain = read_node_properties(node_id, "domain", &domain, properties); | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:232:22: warning: unused variable 'hops' [-Wunused-variable] 232 | uint64_t hops; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:69:14: warning: unused variable 'count' [-Wunused-variable] 69 | uint32_t count = 0; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:104:33: warning: bitwise negation of a boolean expression always evaluates to 'true'; did you mean logical negation? [-Wbool-operation] 104 | if (ret_gpu_id == 0 && ~(ret_unique_id != 0 || ret_loc_id != 0 || ret_unique_id != 0 || ret_vendor != 0) && | ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | ! /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:102:13: warning: unused variable 'ret_domain' [-Wunused-variable] 102 | int ret_domain = read_node_properties(node_id, "domain", &domain, properties); | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:104:33: warning: bitwise negation of a boolean expression always evaluates to 'true'; did you mean logical negation? [-Wbool-operation] 104 | if (ret_gpu_id == 0 && ~(ret_unique_id != 0 || ret_loc_id != 0 || ret_unique_id != 0 || ret_vendor != 0) && | ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | ! /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:102:13: warning: unused variable 'ret_domain' [-Wunused-variable] 102 | int ret_domain = read_node_properties(node_id, "domain", &domain, properties); | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:232:22: warning: unused variable 'hops' [-Wunused-variable] 232 | uint64_t hops; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:69:14: warning: unused variable 'count' [-Wunused-variable] 69 | uint32_t count = 0; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:232:22: warning: unused variable 'hops' [-Wunused-variable] 232 | uint64_t hops; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:69:14: warning: unused variable 'count' [-Wunused-variable] 69 | uint32_t count = 0; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:104:33: warning: bitwise negation of a boolean expression always evaluates to 'true'; did you mean logical negation? [-Wbool-operation] 104 | if (ret_gpu_id == 0 && ~(ret_unique_id != 0 || ret_loc_id != 0 || ret_unique_id != 0 || ret_vendor != 0) && | ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | ! /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:102:13: warning: unused variable 'ret_domain' [-Wunused-variable] 102 | int ret_domain = read_node_properties(node_id, "domain", &domain, properties); | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:232:22: warning: unused variable 'hops' [-Wunused-variable] 232 | uint64_t hops; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:69:14: warning: unused variable 'count' [-Wunused-variable] 69 | uint32_t count = 0; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:104:33: warning: bitwise negation of a boolean expression always evaluates to 'true'; did you mean logical negation? [-Wbool-operation] 104 | if (ret_gpu_id == 0 && ~(ret_unique_id != 0 || ret_loc_id != 0 || ret_unique_id != 0 || ret_vendor != 0) && | ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | ! /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:102:13: warning: unused variable 'ret_domain' [-Wunused-variable] 102 | int ret_domain = read_node_properties(node_id, "domain", &domain, properties); | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:104:33: warning: bitwise negation of a boolean expression always evaluates to 'true'; did you mean logical negation? [-Wbool-operation] 104 | if (ret_gpu_id == 0 && ~(ret_unique_id != 0 || ret_loc_id != 0 || ret_unique_id != 0 || ret_vendor != 0) && | ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | ! /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:102:13: warning: unused variable 'ret_domain' [-Wunused-variable] 102 | int ret_domain = read_node_properties(node_id, "domain", &domain, properties); | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:104:33: warning: bitwise negation of a boolean expression always evaluates to 'true'; did you mean logical negation? [-Wbool-operation] 104 | if (ret_gpu_id == 0 && ~(ret_unique_id != 0 || ret_loc_id != 0 || ret_unique_id != 0 || ret_vendor != 0) && | ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | ! /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:102:13: warning: unused variable 'ret_domain' [-Wunused-variable] 102 | int ret_domain = read_node_properties(node_id, "domain", &domain, properties); | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:104:33: warning: bitwise negation of a boolean expression always evaluates to 'true'; did you mean logical negation? [-Wbool-operation] 104 | if (ret_gpu_id == 0 && ~(ret_unique_id != 0 || ret_loc_id != 0 || ret_unique_id != 0 || ret_vendor != 0) && | ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | ! /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:102:13: warning: unused variable 'ret_domain' [-Wunused-variable] 102 | int ret_domain = read_node_properties(node_id, "domain", &domain, properties); | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:232:22: warning: unused variable 'hops' [-Wunused-variable] 232 | uint64_t hops; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:69:14: warning: unused variable 'count' [-Wunused-variable] 69 | uint32_t count = 0; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:232:22: warning: unused variable 'hops' [-Wunused-variable] 232 | uint64_t hops; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:69:14: warning: unused variable 'count' [-Wunused-variable] 69 | uint32_t count = 0; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:232:22: warning: unused variable 'hops' [-Wunused-variable] 232 | uint64_t hops; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:69:14: warning: unused variable 'count' [-Wunused-variable] 69 | uint32_t count = 0; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:232:22: warning: unused variable 'hops' [-Wunused-variable] 232 | uint64_t hops; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:69:14: warning: unused variable 'count' [-Wunused-variable] 69 | uint32_t count = 0; | ^~~~~ [ 50%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/ibvwrap.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/ibvwrap.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/ibvwrap.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/ibvwrap.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ibvwrap.cc /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:51:20: warning: unused variable 'kPathDRMRoot' [-Wunused-variable] 51 | static const char *kPathDRMRoot = "/sys/class/drm"; | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:558:13: warning: unused function 'fileExists' [-Wunused-function] 558 | static bool fileExists(char const *filename) | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:51:20: warning: unused variable 'kPathDRMRoot' [-Wunused-variable] 51 | static const char *kPathDRMRoot = "/sys/class/drm"; | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:558:13: warning: unused function 'fileExists' [-Wunused-function] 558 | static bool fileExists(char const *filename) | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:51:20: warning: unused variable 'kPathDRMRoot' [-Wunused-variable] 51 | static const char *kPathDRMRoot = "/sys/class/drm"; | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:558:13: warning: unused function 'fileExists' [-Wunused-function] 558 | static bool fileExists(char const *filename) | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:51:20: warning: unused variable 'kPathDRMRoot' [-Wunused-variable] 51 | static const char *kPathDRMRoot = "/sys/class/drm"; | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:558:13: warning: unused function 'fileExists' [-Wunused-function] 558 | static bool fileExists(char const *filename) | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:51:20: warning: unused variable 'kPathDRMRoot' [-Wunused-variable] 51 | static const char *kPathDRMRoot = "/sys/class/drm"; | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:558:13: warning: unused function 'fileExists' [-Wunused-function] 558 | static bool fileExists(char const *filename) | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:51:20: warning: unused variable 'kPathDRMRoot' [-Wunused-variable] 51 | static const char *kPathDRMRoot = "/sys/class/drm"; | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:558:13: warning: unused function 'fileExists' [-Wunused-function] 558 | static bool fileExists(char const *filename) | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:51:20: warning: unused variable 'kPathDRMRoot' [-Wunused-variable] 51 | static const char *kPathDRMRoot = "/sys/class/drm"; | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:558:13: warning: unused function 'fileExists' [-Wunused-function] 558 | static bool fileExists(char const *filename) | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:51:20: warning: unused variable 'kPathDRMRoot' [-Wunused-variable] 51 | static const char *kPathDRMRoot = "/sys/class/drm"; | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:558:13: warning: unused function 'fileExists' [-Wunused-function] 558 | static bool fileExists(char const *filename) | ^~~~~~~~~~ 6 warnings generated when compiling for gfx1100. 2 warnings generated when compiling for host. 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 6 warnings generated when compiling for gfx90a. [ 50%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/ipcsocket.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/ipcsocket.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/ipcsocket.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/ipcsocket.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ipcsocket.cc 2 warnings generated when compiling for gfx90a. 6 warnings generated when compiling for gfx1200. 6 warnings generated when compiling for gfx1201. 6 warnings generated when compiling for gfx1102. 6 warnings generated when compiling for gfx1101. 2 warnings generated when compiling for gfx90a. 2 warnings generated when compiling for gfx1200. 2 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/api_trace.cc:3: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 6 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/api_trace.cc:3: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/api_trace.cc:3: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx1100. 2 warnings generated when compiling for gfx1101. 2 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/api_trace.cc:3: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/api_trace.cc:3: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ [ 50%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/npkit.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/npkit.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/npkit.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/npkit.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/npkit.cc In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ibvsymbols.cc:67: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/api_trace.cc:3: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/api_trace.cc:3: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ibvsymbols.cc:67: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ibvsymbols.cc:67: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/api_trace.cc:3: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ibvsymbols.cc:67: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ibvsymbols.cc:67: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ibvsymbols.cc:67: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ibvsymbols.cc:67: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx1101. 1 warning generated when compiling for host. 1 warning generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ibvsymbols.cc:67: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx1201. 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx1100. 1 warning generated when compiling for gfx1100. 1 warning generated when compiling for gfx1102. 1 warning generated when compiling for gfx1102. 1 warning generated when compiling for gfx1101. [ 51%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/nvmlwrap_stub.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/nvmlwrap_stub.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/nvmlwrap_stub.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/nvmlwrap_stub.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/nvmlwrap_stub.cc 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx1200. 1 warning generated when compiling for gfx90a. [ 51%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/param.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/param.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/param.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/param.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/param.cc In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ibvwrap.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/ibvwrap.h:21: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ibvwrap.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/ibvwrap.h:21: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ibvwrap.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/ibvwrap.h:21: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ibvwrap.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/ibvwrap.h:21: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ibvwrap.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/ibvwrap.h:21: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ibvwrap.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/ibvwrap.h:21: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ibvwrap.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/ibvwrap.h:21: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ibvwrap.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/ibvwrap.h:21: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for host. 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx1100. 1 warning generated when compiling for gfx1101. 1 warning generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ipcsocket.cc:8: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx1102. 1 warning generated when compiling for gfx1201. 1 warning generated when compiling for gfx1101. [ 51%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/profiler.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/profiler.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/profiler.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/profiler.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/profiler.cc In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ipcsocket.cc:8: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ipcsocket.cc:8: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ipcsocket.cc:8: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ipcsocket.cc:8: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ipcsocket.cc:8: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ipcsocket.cc:8: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ipcsocket.cc:8: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/npkit.cc:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/npkit/npkit.h:16: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/npkit.cc:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/npkit/npkit.h:16: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/npkit.cc:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/npkit/npkit.h:16: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/npkit.cc:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/npkit/npkit.h:16: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 1 warning generated when compiling for gfx1201. 1 warning generatedIn file included from when compiling for gfx1100. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/npkit.cc:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/npkit/npkit.h:16: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 1 warning generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/npkit.cc:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/npkit/npkit.h:16: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 1 warning generated when compiling for gfx1102. 1 warning generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/npkit.cc:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/npkit/npkit.h:16: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 1 warning generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/npkit.cc:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/npkit/npkit.h:16: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ [ 51%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/rocm_smi_wrap.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/rocm_smi_wrap.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/rocm_smi_wrap.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/rocm_smi_wrap.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/rocm_smi_wrap.cc In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/npkit.cc:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/npkit.cc:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/npkit.cc:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/npkit.cc:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/npkit.cc:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/npkit.cc:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/npkit.cc:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/npkit.cc:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx1100. 2 warnings generated when compiling for gfx1102. [ 52%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/rocmwrap.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/rocmwrap.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/rocmwrap.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/rocmwrap.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/rocmwrap.cc 2 warnings generated when compiling for gfx1101. 2 warnings generated when compiling for gfx1201. [ 52%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/roctx.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/roctx.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/roctx.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/roctx.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/roctx.cc 2 warnings generated when compiling for gfx90a. 2 warnings generated when compiling for gfx1200. 2 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/proxy.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/proxy.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/proxy.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/proxy.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/proxy.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, heIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/proxy.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ ad, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/proxy.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/proxy.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/proxy.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/proxy.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/proxy.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/proxy.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/proxy.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/proxy.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/proxy.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/proxy.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for host. 2 warnings generated when compiling for gfx90a. 2 warnings generated when compiling for gfx1102. [ 52%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/shmutils.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/shmutils.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/shmutils.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/shmutils.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/shmutils.cc 2 warnings generated when compiling for gfx1100. 2 warnings generated when compiling for gfx1200. 2 warnings generated when compiling for gfx90a. 2 warnings generated when compiling for gfx1101. 2 warnings generated when compiling for gfx1201. [ 52%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/signals.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/signals.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/signals.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/signals.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/signals.cc In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/rocm_smi_wrap.cc:24: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/rocm_smi_wrap.cc:24: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/rocm_smi_wrap.cc:24: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/roctx.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/roctx.h:17: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp:1940:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1940 | 0, // payload value (union) | ^ | {} /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp:1942:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1942 | 0 // message value (union) | ^ | {} In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/rocm_smi_wrap.cc:24: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/rocm_smi_wrap.cc:24: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/rocm_smi_wrap.cc:24: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/rocm_smi_wrap.cc:24: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/roctx.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/roctx.h:17: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp:1940:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1940 | 0, // payload value (union) | ^ | {} /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp:1942:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1942 | 0 // message value (union) | ^ | {} In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/roctx.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/roctx.h:17: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp:1940:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1940 | 0, // payload value (union) | ^ | {} /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp:1942:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1942 | 0 // message value (union) | ^ | {} In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/rocm_smi_wrap.cc:24: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/roctx.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/roctx.h:17: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp:1940:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1940 | 0, // payload value (union) | ^ | {} /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp:1942:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1942 | 0 // message value (union) | ^ | {} In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/roctx.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/roctx.h:17: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp:1940:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1940 | 0, // payload value (union) | ^ | {} /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp:1942:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1942 | 0 // message value (union) | ^ | {} In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/roctx.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/roctx.h:17: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp:1940:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1940 | 0, // payload value (union) | ^ | {} /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp:1942:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1942 | 0 // message value (union) | ^ | {} In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/roctx.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/roctx.h:17: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp:1940:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1940 | 0, // payload value (union) | ^ | {} /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp:1942:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1942 | 0 // message value (union) | ^ | {} In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/roctx.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/roctx.h:17: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp:1940:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1940 | 0, // payload value (union) | ^ | {} /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp:1942:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1942 | 0 // message value (union) | ^ | {} 1 warning generated when compiling for host. 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx1201. 1 warning generated when compiling for gfx1101. 1 warning generated when compiling for gfx1200. 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx1102. 1 warning generated when compiling for gfx1100. [ 53%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/socket.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/socket.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/socket.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/socket.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/socket.cc 6 warnings generated when compiling for host. [ 53%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/strongstream.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/strongstream.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/strongstream.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/strongstream.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/strongstream.cc In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/roctx.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/roctx.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/roctx.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/roctx.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/roctx.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/roctx.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/roctx.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/roctx.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ [ 53%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/tuner.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/tuner.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/tuner.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/tuner.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/tuner.cc 3 warnings generated when compiling for gfx90a. 3 warnings generated when compiling for gfx1102. 3 warnings generated when compiling for gfx1201. 3 warnings generated when compiling for gfx1101. 3 warnings generated when compiling for host. 3 warnings generated when compiling for gfx90a. 3 warnings generated when compiling for gfx1200. 3 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/shmutils.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/shmutils.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/shmutils.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/shmutils.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/shmutils.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:[ 53%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/utils.cc.o 18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/utils.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/utils.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/utils.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/utils.cc In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/shmutils.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/shmutils.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/shmutils.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/shmutils.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/shmutils.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/shmutils.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/shmutils.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/shmutils.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/shmutils.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/shmutils.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/shmutils.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for host. 2 warnings generated when compiling for gfx1100. 2 warnings generated when compiling for gfx90a. 2 warnings generated when compiling for gfx90a. 2 warnings generated when compiling for gfx1102. 2 warnings generated when compiling for gfx1201. 2 warnings generated when compiling for gfx1101. 2 warnings generated when compiling for gfx1200. [ 54%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_lifecycle.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_lifecycle.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_lifecycle.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_lifecycle.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/socket.cc:598:8: warning: unused variable 'line' [-Wunused-variable] 598 | char line[SOCKET_NAME_MAXLEN+1]; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/socket.cc:598:8: warning: unused variable 'line' [-Wunused-variable] 598 | char line[SOCKET_NAME_MAXLEN+1]; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/socket.cc:598:8: warning: unused variable 'line' [-Wunused-variable] 598 | char line[SOCKET_NAME_MAXLEN+1]; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/socket.cc:598:8: warning: unused variable 'line' [-Wunused-variable] 598 | char line[SOCKET_NAME_MAXLEN+1]; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/socket.cc:598:8: warning: unused variable 'line' [-Wunused-variable] 598 | char line[SOCKET_NAME_MAXLEN+1]; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/socket.cc:598:8: warning: unused variable 'line' [-Wunused-variable] 598 | char line[SOCKET_NAME_MAXLEN+1]; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/socket.cc:598:8: warning: unused variable 'line' [-Wunused-variable] 598 | char line[SOCKET_NAME_MAXLEN+1]; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/socket.cc:598:8: warning: unused variable 'line' [-Wunused-variable] 598 | char line[SOCKET_NAME_MAXLEN+1]; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/socket.cc:8: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/socket.cc:8: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ [ 54%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_parser.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_parser.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_parser.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_parser.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/socket.cc:8: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/socket.cc:8: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/socket.cc:8: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/socket.cc:8: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/socket.cc:8: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/socket.cc:8: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx1200. 2 warnings generated when compiling for gfx1102. 2 warnings generated when compiling for gfx1100. 2 warnings generated when compiling for gfx90a. 2 warnings generated when compiling for gfx1101. 2 warnings generated when compiling for gfx90a. 2 warnings generated when compiling for gfx1201. [ 54%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_setup.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_setup.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_setup.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_setup.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc 2 warnings generated when compiling for host. [ 54%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_status.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_status.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_status.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_status.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_status.cc In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/utils.cc:7: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/utils.cc:7: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/utils.cc:7: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/utils.cc:7: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/utils.cc:7: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/utils.cc:7: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ [ 55%] Building CXX object CMakeFiles/rccl.dir/hipify/src/transport/coll_net.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/transport/coll_net.cc.o -MF CMakeFiles/rccl.dir/hipify/src/transport/coll_net.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/transport/coll_net.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/utils.cc:7: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/utils.cc:7: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx1200. 1 warning generated when compiling for host. 1 warning generated when compiling for gfx1100. 1 warning generated when compiling for gfx1102. 1 warning generated when compiling for gfx1101. 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx1201. [ 55%] Building CXX object CMakeFiles/rccl.dir/hipify/src/transport/net_tmp.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/transport/net_tmp.cc.o -MF CMakeFiles/rccl.dir/hipify/src/transport/net_tmp.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/transport/net_tmp.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:18: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:18: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:18: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:18: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:18: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:18: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:18: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:18: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:16: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_struct.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:16: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_struct.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:16: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_struct.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:16: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_struct.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:16: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_struct.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:711:16: warning: unused variable 'ret' [-Wunused-variable] 711 | ncclResult_t ret = ncclSuccess; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:723:16: warning: unused variable 'ret' [-Wunused-variable] 723 | ncclResult_t ret = ncclSuccess; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:16: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_struct.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:16: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_struct.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:16: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_struct.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:711:16: warning: unused variable 'ret' [-Wunused-variable] 711 | ncclResult_t ret = ncclSuccess; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:723:16: warning: unused variable 'ret' [-Wunused-variable] 723 | ncclResult_t ret = ncclSuccess; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:512:10: warning: unused variable 'nBytes' [-Wunused-variable] 512 | size_t nBytes = count * ncclTypeSize(dataType); | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:711:16: warning: unused variable 'ret' [-Wunused-variable] 711 | ncclResult_t ret = ncclSuccess; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:711:16: warning: unused variable 'ret' [-Wunused-variable] 711 | ncclResult_t ret = ncclSuccess; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:711:16: warning: unused variable 'ret' [-Wunused-variable] 711 | ncclResult_t ret = ncclSuccess; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:723:16: warning: unused variable 'ret' [-Wunused-variable] 723 | ncclResult_t ret = ncclSuccess; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:723:16: warning: unused variable 'ret' [-Wunused-variable] 723 | ncclResult_t ret = ncclSuccess; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:723:16: warning: unused variable 'ret' [-Wunused-variable] 723 | ncclResult_t ret = ncclSuccess; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:512:10: warning: unused variable 'nBytes' [-Wunused-variable] 512 | size_t nBytes = count * ncclTypeSize(dataType); | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:711:16: warning: unused variable 'ret' [-Wunused-variable] 711 | ncclResult_t ret = ncclSuccess; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:723:16: warning: unused variable 'ret' [-Wunused-variable] 723 | ncclResult_t ret = ncclSuccess; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:711:16: warning: unused variable 'ret' [-Wunused-variable] 711 | ncclResult_t ret = ncclSuccess; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:723:16: warning: unused variable 'ret' [-Wunused-variable] 723 | ncclResult_t ret = ncclSuccess; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:512:10: warning: unused variable 'nBytes' [-Wunused-variable] 512 | size_t nBytes = count * ncclTypeSize(dataType); | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:711:16: warning: unused variable 'ret' [-Wunused-variable] 711 | ncclResult_t ret = ncclSuccess; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:512:10: warning: unused variable 'nBytes' [-Wunused-variable] 512 | size_t nBytes = count * ncclTypeSize(dataType); | ^~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:723:16: warning: unused variable 'ret' [-Wunused-variable] 723 | ncclResult_t ret = ncclSuccess; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:512:10: warning: unused variable 'nBytes' [-Wunused-variable] 512 | size_t nBytes = count * ncclTypeSize(dataType); | ^~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:512:10: warning: unused variable 'nBytes' [-Wunused-variable] 512 | size_t nBytes = count * ncclTypeSize(dataType); | ^~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:512:10: warning: unused variable 'nBytes' [-Wunused-variable] 512 | size_t nBytes = count * ncclTypeSize(dataType); | ^~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:512:10: warning: unused variable 'nBytes' [-Wunused-variable] 512 | size_t nBytes = count * ncclTypeSize(dataType); | ^~~~~~ 4 warnings generated when compiling for gfx1100. 4 warnings generated when compiling for gfx1200. 4 warnings generated when compiling for gfx90a. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:127:27: warning: unused variable 'threadLocalStatus' [-Wunused-variable] 127 | mscclThreadLocalStatus& threadLocalStatus = mscclGetThreadLocalStatus(); | ^~~~~~~~~~~~~~~~~ 4 warnings generated when compiling for gfx1102. 4 warnings generated when compiling for gfx90a. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:127:27: warning: unused variable 'threadLocalStatus' [-Wunused-variable] 127 | mscclThreadLocalStatus& threadLocalStatus = mscclGetThreadLocalStatus(); | ^~~~~~~~~~~~~~~~~ 4 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_status.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_status.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_struct.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 4 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_status.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_status.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_struct.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_status.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_status.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_struct.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:16: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:18: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:21: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:32:20: warning: unused variable 'mscclAlgoFilePathEnv' [-Wunused-variable] 32 | static const char* mscclAlgoFilePathEnv = "MSCCL_ALGO_FILE_PATH"; | ^~~~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_status.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_status.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_struct.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_status.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_status.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_struct.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:127:27: warning: unused variable 'threadLocalStatus' [-Wunused-variable] 127 | mscclThreadLocalStatus& threadLocalStatus = mscclGetThreadLocalStatus(); | ^~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_status.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_status.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_struct.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_status.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_status.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_struct.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:127:27: warning: unused variable 'threadLocalStatus' [-Wunused-variable] 127 | mscclThreadLocalStatus& threadLocalStatus = mscclGetThreadLocalStatus(); | ^~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:127:27: warning: unused variable 'threadLocalStatus' [-Wunused-variable] 127 | mscclThreadLocalStatus& threadLocalStatus = mscclGetThreadLocalStatus(); | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:127:27: warning: unused variable 'threadLocalStatus' [-Wunused-variable] 127 | mscclThreadLocalStatus& threadLocalStatus = mscclGetThreadLocalStatus(); | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:127:27: warning: unused variable 'threadLocalStatus' [-Wunused-variable] 127 | mscclThreadLocalStatus& threadLocalStatus = mscclGetThreadLocalStatus(); | ^~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_status.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_status.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_struct.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:16: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:18: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:21: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:32:20: warning: unused variable 'mscclAlgoFilePathEnv' [-Wunused-variable] 32 | static const char* mscclAlgoFilePathEnv = "MSCCL_ALGO_FILE_PATH"; | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:127:27: warning: unused variable 'threadLocalStatus' [-Wunused-variable] 127 | mscclThreadLocalStatus& threadLocalStatus = mscclGetThreadLocalStatus(); | ^~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:16: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:18: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:21: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:32:20: warning: unused variable 'mscclAlgoFilePathEnv' [-Wunused-variable] 32 | static const char* mscclAlgoFilePathEnv = "MSCCL_ALGO_FILE_PATH"; | ^~~~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:6: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:16: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:18: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:21: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:32:20: warning: unused variable 'mscclAlgoFilePathEnv' [-Wunused-variable] 32 | static const char* mscclAlgoFilePathEnv = "MSCCL_ALGO_FILE_PATH"; | ^~~~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:16: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:18: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:21: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:32:20: warning: unused variable 'mscclAlgoFilePathEnv' [-Wunused-variable] 32 | static const char* mscclAlgoFilePathEnv = "MSCCL_ALGO_FILE_PATH"; | ^~~~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:16: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:18: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:21: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:32:20: warning: unused variable 'mscclAlgoFilePathEnv' [-Wunused-variable] 32 | static const char* mscclAlgoFilePathEnv = "MSCCL_ALGO_FILE_PATH"; | ^~~~~~~~~~~~~~~~~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:16: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:18: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:21: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:32:20: warning: unused variable 'mscclAlgoFilePathEnv' [-Wunused-variable] 32 | static const char* mscclAlgoFilePathEnv = "MSCCL_ALGO_FILE_PATH"; | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:6: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:16: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:18: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:21: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:32:20: warning: unused variable 'mscclAlgoFilePathEnv' [-Wunused-variable] 32 | static const char* mscclAlgoFilePathEnv = "MSCCL_ALGO_FILE_PATH"; | ^~~~~~~~~~~~~~~~~~~~ 4 warnings generated when compiling for host. 15 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:6: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ [ 55%] Building CXX object CMakeFiles/rccl.dir/hipify/src/transport/net_ib.cc.o In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:6: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/transport/net_ib.cc.o -MF CMakeFiles/rccl.dir/hipify/src/transport/net_ib.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/transport/net_ib.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_ib.cc In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:6: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:6: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:6: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ 15 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:6: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 15 warnings generated when compiling for gfx90a. 15 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 4 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 15 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 4 warnings generated when compiling for gfx1101. 15 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 15 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 4 warnings generated when compiling for gfx1201. 4 warnings generated when compiling for gfx90a. 4 warnings generated when compiling for gfx1200. 4 warnings generated when compiling for gfx1102. 4 warnings generated when compiling for gfx90a. 1 warning generated when compiling for gfx1101. 1 warning generated when compiling for gfx1100. 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ 1 warning generated when compiling for gfx1200. In file included from 1 warning generated when compiling for gfx1201. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:9: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:199:21: warning: unused function 'collNetDumpMap' [-Wunused-function] 199 | static ncclResult_t collNetDumpMap(struct connectMap* map) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:402:21: warning: unused function 'sharedBuffersGet' [-Wunused-function] 402 | static ncclResult_t sharedBuffersGet(struct ncclCollNetSharedRes* collNet, int type, int slot, int channel, int* offset) { | ^~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:9: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:199:21: warning: unused function 'collNetDumpMap' [-Wunused-function] 199 | static ncclResult_t collNetDumpMap(struct connectMap* map) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:402:21: warning: unused function 'sharedBuffersGet' [-Wunused-function] 402 | static ncclResult_t sharedBuffersGet(struct ncclCollNetSharedRes* collNet, int type, int slot, int channel, int* offset) { | ^~~~~~~~~~~~~~~~ 1 warning generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:9: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:199:21: warning: unused function 'collNetDumpMap' [-Wunused-function] 199 | static ncclResult_t collNetDumpMap(struct connectMap* map) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:402:21: warning: unused function 'sharedBuffersGet' [-Wunused-function] 402 | static ncclResult_t sharedBuffersGet(struct ncclCollNetSharedRes* collNet, int type, int slot, int channel, int* offset) { | ^~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ 23 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:9: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:199:21: warning: unused function 'collNetDumpMap' [-Wunused-function] 199 | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:9: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; static ncclResult_t collNetDumpMap(struct connectMap* map) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:402:21: warning: unused function 'sharedBuffersGet' [-Wunused-function] 402 | static ncclResult_t sharedBuffersGet(struct ncclCollNetSharedRes* collNet, int type, int slot, int channel, int* offset) { | ^~~~~~~~~~~~~~~~ } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:199:21: warning: unused function 'collNetDumpMap' [-Wunused-function] 199 | static ncclResult_t collNetDumpMap(struct connectMap* map) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:402:21: warning: unused function 'sharedBuffersGet' [-Wunused-function] 402 | static ncclResult_t sharedBuffersGet(struct ncclCollNetSharedRes* collNet, int type, int slot, int channel, int* offset) { | ^~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:9: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:199:21: warning: unused function 'collNetDumpMap' [-Wunused-function] 199 | static ncclResult_t collNetDumpMap(struct connectMap* map) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:402:21: warning: unused function 'sharedBuffersGet' [-Wunused-function] 402 | static ncclResult_t sharedBuffersGet(struct ncclCollNetSharedRes* collNet, int type, int slot, int channel, int* offset) { | ^~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:9: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:199:21: warning: unused function 'collNetDumpMap' [-Wunused-function] 199 | static ncclResult_t collNetDumpMap(struct connectMap* map) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:402:21: warning: unused function 'sharedBuffersGet' [-Wunused-function] 402 | static ncclResult_t sharedBuffersGet(struct ncclCollNetSharedRes* collNet, int type, int slot, int channel, int* offset) { | ^~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:9: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:199:21: warning: unused function 'collNetDumpMap' [-Wunused-function] 199 | static ncclResult_t collNetDumpMap(struct connectMap* map) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:402:21: warning: unused function 'sharedBuffersGet' [-Wunused-function] 402 | static ncclResult_t sharedBuffersGet(struct ncclCollNetSharedRes* collNet, int type, int slot, int channel, int* offset) { | ^~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ 23 warnings generated when compiling for gfx1101. In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14:170:12: warning: unused variable 'mh' [-Wunused-variable] : warning: unused variable 'info' [-Wunused-variable] 170168 | | gdr_ gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | ivnfoo_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.hid *gdr:Map172; :| ^~~~~~ 9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ 1 warning generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ 23 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ 23 warnings generated when compiling for gfx1201. 23 warnings generated when compiling for gfx1200. 23 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ [ 55%] Building CXX object CMakeFiles/rccl.dir/hipify/src/transport/net_socket.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/transport/net_socket.cc.o -MF CMakeFiles/rccl.dir/hipify/src/transport/net_socket.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/transport/net_socket.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_socket.cc 23 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:19: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:277:21: warning: unused function 'netDumpMap' [-Wunused-function] 277 | static ncclResult_t netDumpMap(struct connectMap* map) { | ^~~~~~~~~~ 4 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:19: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:277:21: warning: unused function 'netDumpMap' [-Wunused-function] 277 | static ncclResult_t netDumpMap(struct connectMap* map) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:19: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:277:21: warning: unused function 'netDumpMap' [-Wunused-function] 277 | static ncclResult_t netDumpMap(struct connectMap* map) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:19: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct nIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:19: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] cclTopoSystem* system, int dev, int* rank) { 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:277:21: warning: unused function 'netDumpMap' [-Wunused-function] 277 | static ncclResult_t netDumpMap(struct connectMap* map) { | ^~~~~~~~~~ | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(intIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:19: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:277:21: warning: unused function 'netDumpMap' [-Wunused-function] 277 | static ncclResult_t netDumpMap(struct connectMap* map) { | ^~~~~~~~~~ cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:277:21: warning: unused function 'netDumpMap' [-Wunused-function] 277 | static ncclResult_t netDumpMap(struct connectMap* map) { | ^~~~~~~~~~ [ 56%] Building CXX object CMakeFiles/rccl.dir/hipify/src/transport/nvls.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/transport/nvls.cc.o -MF CMakeFiles/rccl.dir/hipify/src/transport/nvls.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/transport/nvls.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/nvls.cc In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:19: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:277:21: warning: unused function 'netDumpMap' [-Wunused-function] 277 | static ncclResult_t netDumpMap(struct connectMap* map) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:19: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:277:21: warning: unused function 'netDumpMap' [-Wunused-function] 277 | static ncclResult_t netDumpMap(struct connectMap* map) { | ^~~~~~~~~~ 16 warnings generated when compiling for gfx1100. 16 warnings generated when compiling for gfx1200. 16 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_ib.cc:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_ib.cc:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_ib.cc:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 16 warnings generated when compiling for gfx1101. 16 warnings generated when compiling for gfx90a. 16 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_ib.cc:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_ib.cc:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_ib.cc:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 16 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_ib.cc:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_ib.cc:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_ib.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_ib.cc:29: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:110:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 110 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:204:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 204 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 255 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:288:21: warning: unused function 'xmlAddNode' [-Wunused-function] 288 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 23 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_ib.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_ib.cc:29: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:110:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 110 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:204:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 204 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 255 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:288:21: warning: unused function 'xmlAddNode' [-Wunused-function] 288 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ [ 56%] Building CXX object CMakeFiles/rccl.dir/hipify/src/transport/p2p.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/transport/p2p.cc.o -MF CMakeFiles/rccl.dir/hipify/src/transport/p2p.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/transport/p2p.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/p2p.cc In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_ib.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_ib.cc:29: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:110:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 110 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:204:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 204 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 255 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:288:21: warning: unused function 'xmlAddNode' [-Wunused-function] 288 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_ib.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_ib.cc:29: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:110:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 110 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:204:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 204 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 255 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:288:21: warning: unused function 'xmlAddNode' [-Wunused-function] 288 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_ib.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_ib.cc:29: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:110:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 110 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:204:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 204 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 255 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:288:21: warning: unused function 'xmlAddNode' [-Wunused-function] 288 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_ib.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_ib.cc:29: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:110:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 110 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName,In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_ib.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_ib.cc:29: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:110:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 110 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:204:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 204 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 255 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:288:21: warning: unused function 'xmlAddNode' [-Wunused-function] 288 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:204:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 204 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct n c | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ clXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 255 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:288:21: warning: unused function 'xmlAddNode' [-Wunused-function] 288 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_ib.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_ib.cc:29: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:110:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 110 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:204:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 204 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 255 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:288:21: warning: unused function 'xmlAddNode' [-Wunused-function] 288 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 23 warnings generated when compiling for gfx90a. 23 warnings generated when compiling for gfx90a. 23 warnings generated when compiling for gfx1102. 23 warnings generated when compiling for gfx1101. 23 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_socket.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 23 warnings generated when compiling for gfx1201. 23 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_socket.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_socket.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 15 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_socket.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/nvls.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_socket.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_socket.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_socket.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ [ 56%] Building CXX object CMakeFiles/rccl.dir/hipify/src/transport/shm.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/src/transport/shm.cc.o -MF CMakeFiles/rccl.dir/hipify/src/transport/shm.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/transport/shm.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/shm.cc In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_socket.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_socket.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_socket.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/nvls.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/nvls.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_socket.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/nvls.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/nvls.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_socket.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_socket.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_socket.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_socket.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/nvls.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/nvls.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 16 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/nvls.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_socket.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/nvls.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ [ 56%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_gather_sum_i8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_gather_sum_i8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_gather_sum_i8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_gather_sum_i8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/nvls.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/nvls.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx1102. 2 warnings generated when compiling for host. 2 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/nvls.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/nvls.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/nvls.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/nvls.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx1201. 2 warnings generated when compiling for gfx1100. 2 warnings generated when compiling for gfx90a. 2 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/nvls.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx1101. [ 57%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_bf16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_bf16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_bf16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_bf16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp 2 warnings generated when compiling for gfx1200. 2 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 2 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 2 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 2 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/p2p.cc:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ [ 57%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_bf8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_bf8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_bf8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_bf8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/p2p.cc:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ 23 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/p2p.cc:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/p2p.cc:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/p2p.cc:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ [ 57%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/p2p.cc:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/p2p.cc:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/p2p.cc:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 10 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ [ 57%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ a; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 2 warnings generated when compiling for gfx90a. 2 warnings generated when compiling for gfx1102. 2 warnings generated when compiling for gfx90a. 2 warnings generated when compiling for gfx1200. 2 warnings generated when compiling for gfx1101. 2 warnings generated when compiling for gfx1100. 2 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 2 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] In file included from 140 | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp : 2 : In file included from u/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.hi:n10t: 3In file included from 2/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h_:t169 : da/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.hta:1270,: 19f:l awarning: g1unused variable 'ptr' [-Wunused-variable], data2, flag2; | ^~~~~ 270 | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140: 21 : warning: unused variable 'flag1' [-Wunused-variable] uint 61404 | _ t * pturi n= tre3c2vP_trt(0 )d+altl1a281Of,f seft;l a g| ^~~1 , data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ [ 58%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:60:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 60 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:159:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 159 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllGather_RING_SIMPLE_Sum_i8, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ :222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | 1, dat a2, flag2c; o| ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.hn:140s:35: twarning: unused variable 'flag2' [-Wunused-variable] 140 | s suint3i2_t zdatea1, f_lag1,t dat a2, sflagi2; ze = args->count; | ^~~~ | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:60:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 60 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:159:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 159 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllGather_RING_SIMPLE_Sum_i8, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:60:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 60 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:173:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 173 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllGather_RING_LL128_Sum_i8, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:60:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 60 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:159:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 159 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllGather_RING_SIMPLE_Sum_i8, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:60:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 60 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:159:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 159 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllGather_RING_SIMPLE_Sum_i8, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:60:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 60 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:159:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 159 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllGather_RING_SIMPLE_Sum_i8, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:60:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 60 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:159:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 159 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllGather_RING_SIMPLE_Sum_i8, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:60:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 60 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:173:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 173 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllGather_RING_LL128_Sum_i8, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:60:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 60 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:159:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 159 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllGather_RING_SIMPLE_Sum_i8, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:60:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 60 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:159:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 159 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllGather_RING_SIMPLE_Sum_i8, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:60:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 60 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:159:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 159 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllGather_RING_SIMPLE_Sum_i8, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:60:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 60 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:159:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 159 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllGather_RING_SIMPLE_Sum_i8, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:60:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 60 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:159:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 159 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllGather_RING_SIMPLE_Sum_i8, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:60:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 60 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:159:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 159 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllGather_RING_SIMPLE_Sum_i8, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:60:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 60 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:159:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 159 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllGather_RING_SIMPLE_Sum_i8, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:60:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 60 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:159:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 159 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllGather_RING_SIMPLE_Sum_i8, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:60:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 60 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:159:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 159 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllGather_RING_SIMPLE_Sum_i8, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:60:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 60 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:159:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 159 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllGather_RING_SIMPLE_Sum_i8, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:1: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cppIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ :2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElementcount; | ^~~~ COLL_UNROLL>().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset;/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h | : ^~~ 222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16, ncclFuncAllReduc/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ e, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16, nccIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ lFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140: | 667: 15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667u | i tnid(ttid3), 2nth_reatds( nthdreaads)t, taidI1nBl,ock (thfrealdIdaxg.x)1, g,roup (grdoupa), t | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ a | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 2 668, | sfteplSizae(stgepS2iz;e_ == 0 ? | nccl ^~~~~Shm em/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h.comm.buffSizes:[NC140CL_:PRO21TO_:SIM PLEwarning: ]/Nunused variable 'flag1' [-Wunused-variable]CCL _S TEPS/sizeo140f(T | ) : st epSi ze_ ) {u i| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ n| group(group t/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h32:252:_90: tnote: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252d | a t Praimi1tiv,es,f /*lDirect=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16, ncclFuncag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ AllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Proto, COLL_UNROLL>().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->counIn file included from t/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ ; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ :370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidstepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMiInnBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Max, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncMinMax<__half>, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncMinMax<__half>, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.co/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ mm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncMinMax<__half>, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFIIn file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direc/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, argst-=>*/r0,e PdroOtop, A0>r pgriNE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ms) ;| ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h | : ^565: 5:/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here :1065565 | : 5 :ru nTnote: reein instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncMinMax<__half>, ProtoLL128, 2>' requested hereUp D own,T C,OLL _URNeROdLL>O(aprg,s) ; P | ^r /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hotoL:203L:66:1 note: 2in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 8 ,203 | C O L L Ru_nWUorNkERleOmeLntLn,( Ta, rRedgOps, )Al;go , Proto, COLL_UNROLL>().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16| , ^n c/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hclFunc:A203l:l66R:e dnote: uin instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested herec e , 203F | u n c M i n M aRxu,n WhoarlkfE,l eNmCeCnLt_:(406):.52r:u nnote: (expanded from macro 'DEFINE_ncclDevFunc'w e );406 | | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cppRunWo:r5k:<1c:o lnote: lin instantiation of member function 'RunWork, 0, 1, 2>::run' requested here, ty,5 | rDeEdFoIpNc,c laDlegvoF,u nporf(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ cot(oA,l l2R>eIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ (d).urcuen_(T&RnEcEc_lLSLh1m2e8m_.MwionrMka)x;_ f\1 6 | , ^ n/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hcclFu:n667c:A15l:l note: Rfield 'nthreads' will be initialized after field 'tidInBlock'e d uce667, | F u n ctMiidn(Mtaixd,) ,h anltfh,r eNaCdCsL(_nAtLhGrOe_aTdRsE)E,, tNiCdCILn_BPlRoOcTkO(_tLhLr1e2a8d)I d x| .^x /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h), gr:o406u:p52(:g rnote: oexpanded from macro 'DEFINE_ncclDevFunc'u p ),406 | | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h Run:W667o:r60k:< cnote: ofield 'group' will be initialized after field 'stepSize'l l , 667t | y , r edtiodp<(tty>i,d )a,l gnot,h rperaodtso(,n t2h>r(e)a.drsu)n,( &tnicdcIlnSBhlmoeckm(.twhorreka)d;I \d x .| x ^) , group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncMinMax<__half>, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncMinMax<__half>, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBloc/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hk:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ (threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PR/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group),OTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hty>, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buff/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ LE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | t17 warnings generated when compiling for host. id(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/si/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ zeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | ru/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ nRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllRe/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hduc:e_667R:I15N:G _warning: SIinitializer order does not match the declaration order [-Wreorder-ctor]M PLE_MinMax_bf8, ncclFuncAllReduce, 667F | u n c M itniMda(xt,i dr)c,c ln_tbhfrleoaadts8(,n tNhCrCeLa_dAsL)G,O _tRiIdNIGn,B lNoCcCkL(_tPhRrOeTaOd_ISdIxM.PxL)E,) g r| o^u p(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h :| 409 tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_: 52: note: expanded from macro 'DEFINE_ncclDevFunc' 409668 | | RsutneWpoSrikzn,c callSghom,e mp.rcootmom,. b4u>f(f)S.irzuens([&NnCcCcLl_SPhRmOeTmO._wSoIrMkP)L;E ]\/ N C| C ^L _STEPS/sizeo/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hf:(T667):15 :: st enote: pSifield 'nthreads' will be initialized after field 'tidInBlock'z e_) { | 667 | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group tid(tid), nthreads(nt/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hh:r62:e56a:d s), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ metric<1>, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEP/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ S/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ :370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_LL128) In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 17 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ : warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here :370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 17 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ edOp, ProtoLL128, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().rIn file included from u/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ n(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ redop, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/N/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hC:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ CL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown,/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp :C2O: LL/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h_U:N33R:O19L:L >warning: (unused variable 'size' [-Wunused-variable]a rgs); | ^ 33 | con/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hs:t203 :s66s:i znote: ein instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here_ t size = arg s203- | > c o u n t ; | Run ^~~~Wo rkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFuIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ nc(AllReduce_TREE_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWoIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ rk, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ InBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ Size(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ : note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().ru/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ n(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ 17 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx90a. [ 58%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32In file included from _t /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cppd:at2a: 1,/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h :f33l:a19g:1 ,warning: unused variable 'size' [-Wunused-variable]d ata2, flag2; | ^~~~~ 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ :222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t si/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ ze = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ :370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Prim | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ itives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSizeIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ _ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> pIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ rims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), groupIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ (group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1102. 21 warnings generated when compiling for gfx90a. 21 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx1101. 21 warnings generated when compiling for gfx90a. 21 warnings generated when compiling for gfx90a. [ 58%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_u32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_u32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp [ 58%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_u64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_u64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp 21 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1102. 21 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx1200. [ 59%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_u8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_u8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ :222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | :370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ +ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->coun 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ t; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffs/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ et / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, dataIn file included from 2, fl/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cppa:g22;: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h| : ^~~~~10 : In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h169:: 140:/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h28:: 270warning: :unused variable 'data2' [-Wunused-variable]19 : warning: unused variable 'ptr' [-Wunused-variable] 140 | uint32_t data1 ,270 | f l a g 1 , d autian2t,6 4f_lta*g 2p;t r | ^~~~~= rec/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.hv:P140t:r35(:0 )warning: +unused variable 'flag2' [-Wunused-variable]l l128Offs e140 | t ; | u ^~~i nt32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), In file included from | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidIn/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:B2: In file included from l/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: oIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hc:667:15k: warning: initializer order does not match the declaration order [-Wreorder-ctor]( 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives st,epSi ze(s/tepSi*ze_ D== 0i ? nrcclSehct=*/0, Proto, me0m.co>mm.bu ffSipzes[rNCCims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReL_PROTO_SIMPLE]/In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ etric<1, NCCL_MAX_DEV_ARITY>, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ duce_TREE_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | R/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cppunWor:k7<:c1o:l lnote: ,in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here t y, 7r | eDdEoFpIn,c callDgeov,F upnrco(tAol,l R2e>d(u)c.er_uTnR(E&En_cSIcMlPSLhEm_eMmi.nwMoarxk_)u;6 4\, n| c ^c l/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hFunc:A667l:l15R:e dnote: ufield 'nthreads' will be initialized after field 'tidInBlock'c e , F667u | n c M i ntMiadx(,t iudi)n,t 6n4t_htr,e aNdCsC(Ln_tAhLrGeOa_dTsR)E,E ,t iNdCICnBlLo_cPkR(OtThOr_eSaIdMIPdLxE.)x ) ,| ^g /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hroup:(406g:r52o:u pnote: )expanded from macro 'DEFINE_ncclDevFunc', | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h406 | : 667 : 60 :R unote: nfield 'group' will be initialized after field 'stepSize'W o rk667< | c o l l ,t itdy(,t irde)d,o pne,a dasl(gnot,h rperaodtso),, 2t>i(d)I.nrBulno(c&kn(ctchlrSehamdeImd.xw.ox)r,k )g;r o\u p | ( ^g r/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.houp):,667 : 15| : ^~~~~~~~~~~ note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group RunWorkElement().ru/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hn(:we252):90; : | ^note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, 0, 2, 2>::run' requested heres ymmetriccc,lD e/vF*uDnci(ArlelRcedtuc=e_*T/R0E,E_ SPIMrPLoEt_Moin,M a0x_>u6 4p, rnciclmFsu nc A| ll ^R educe, FuncMinMa/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hx,: 565ui:nt56:4_ t,note: Nin instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested hereCC L_ALGO_TREE, N565C | C L_ PR OT O_rSuInMPTLrE)e e U| ^p Downc,ol lC, OtLyL,_U NrReOdoLpL<>ty(>,a raglsg)o;, p | r ^o to, 2>().run/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h(:&203nc:c66l:S hnote: min instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested heree m.work) ;203 | \ | ^ Ru/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:n667W:o15r:k Enote: lfield 'nthreads' will be initialized after field 'tidInBlock'em ent)(,) .triudnI(nweBl)o;ck ( t| h ^r eadIdx.x/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp):,7 :g1ro:u pnote: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here(g roup), | ^~~~~~~~~~~~~~~~~ 7/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h | :D667E:F60I: Nnote: Efield 'group' will be initialized after field 'stepSize' _ncc 667l | D e v F tuindc(t(Aild)l,R ednuthcree_aTdRs(EnEt_hrSeIaMdPsLE)_,M itindMInaBxlo_cuk3(2th,r enadcIdcx.lx)F,u ngcroAlulp(Rgerdouup)c, e ,| F ^~~~~~~~~~~un cMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(a/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ rgs); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ INE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffS/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepS/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ izes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nt/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hh:r667e:a15d: s(warning: ninitializer order does not match the declaration order [-Wreorder-ctor]t hreads), tidInBlock(threadIdx.x) ,667 | g r otiudp((tgirdo),u pn)th,r e a| d ^~~~~~~~~~~~~~~~~s( nthrea/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hds:)667, :t60id:I nnote: Blfield 'group' will be initialized after field 'stepSize'ock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x),/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32, ncclFun/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we)cAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from [ 59%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_bf16.cpp.o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ :222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h/usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_bf16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_bf16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_bf16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp :370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().ru/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ (tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTr17ee warningUsp generatedDo when compiling for hostw. n, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ n, T, RedOp, Algo, Proto, COLL_UNROLL>().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Pr o667 | t o , 0>t ipdr(imtsi d), | n ^t hreads(n/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.ht:565hr:e5:ad note: sin instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here) , tidIn B565 | l o c k(rtuhnreTardIedexU.pxD)o,wn pS,i zCe(OsLteLp_SUiNzeR_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ OLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(grIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ oup), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h_:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ :370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); :| ^667 :/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h15: warning: :initializer order does not match the declaration order [-Wreorder-ctor]203 : 66: note: 667in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here | 203 | t i d ( t i d ) ,R unntWhorrkEleeamdesn(tn((g)r.oruupn)(,we ) | ; ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | | ^ tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp 668: | 7 : 1 : snote: tin instantiation of member function 'RunWork, 0, 2, 2>::run' requested heree p Siz7e | (DsEtFeIpNSEi_znec_c l=D=e v0F u?n cn(cAclllSRhemdeumc.ec_oTmRmE.Eb_uSfIfMSPiLzEe_sM[iNnCMCaLx__PuR8O,T On_cScIlMFPuLnEc]A/lNlCRCeLd_uScTeE,P SF/uncsMiizneMoafx(,T )u i:n ts8t_etp,S iNzCeC_L)_ A{L G O| _ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~T R E| E group(group, /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hNCCL_:P301R:O90T:O _note: Sin instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested hereI M PLE301) | | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h Pr:i406m:i52t:i vnote: eexpanded from macro 'DEFINE_ncclDevFunc's < T,406 | R e d O pR,u nFWaonrAksX,_ DaElVg_oA,R IpTrYo>t,o ,/ *2D>i(r)e.crtu=n*(/&0n,c cPlrShomtoe,m. w0o>r kp)r;i m\s | | ^ ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:667::15565:: 5note: :field 'nthreads' will be initialized after field 'tidInBlock' note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 667 | 565 | t i dr(utniTd),r enetUhprDeoadwsn(p,( gCrOoLuLp_)U,N R O| L ^~~~~~~~~~~~~~~~~L >/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h(ar:g667s:)60;: note: field 'group' will be initialized after field 'stepSize'| ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h667 | t:i203d:(66t:i dnote: )in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here, nt203h | r e a d s ( n t hRruenaWdosr), tkiEdlIenmBelnotc().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 17 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ )+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16, ncclFuncA/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ llReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_n/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hcclD:ev667F:u15n:c (warning: Ainitializer order does not match the declaration order [-Wreorder-ctor]l lReduce_TREE_SIMPLE_PreMulSum_bf1 6667, | n c c ltFiudn(ctAildl)R,e dnutcher,e aFdusn(cnPtrherMeualdSsu)m,, thiidpI_nbBflloocakt(1t6h,r eNaCdCILd_xA.LxG)O,_ TgRrEoEu,p (NgCrCoLu_pP)R,O T O| _ ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~S I M| P tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_L E) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52668: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitive/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hs ,667 | / * D i rteicdt(=t*i/d0),, Prnotthor,e a0d>s (pnrtihmrse a d| s ^) , tidInBlock(thr/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.he:a565d:I5d:x .note: xin instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here) , group(grou p565) | , | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~r u n| T tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_r eeUpDownn,c cClOSLLh_mUeNmR.OLcLo>m(ma.rbgusf)f;S i z| e ^s [NCCL_PROTO_SIMPLE]/NCC/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hL:_203S:T66E:P Snote: /in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested heres izeof(T) : 203s | t e p S i z e _ )R u{n W o| r ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~kE l e| m group(groupe nt()./builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hr:u252n:(90w:e )note: ;in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here | ^ 252 | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp : 7P:r1i:m inote: tin instantiation of member function 'RunWork, 0, 2, 4>::run' requested herei vesSu,m _/*bDfi1r6e,c tn=*c/c0l,F uPnrcoAtlol,Re d0u>c e,pr imFsun c P| r ^e MulSum, h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hip:_565bf:l5o:at1 6,note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested hereN CCL_ALG O565_ | T R E Eru, nNCTCrLe_PeURpODToOwn_Sll,, CtOyL,L _rUedNoRpy(>,a arlggos, )p;r o t| ^o, 4>().run(&/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hn:c203c:l66Sh:m note: em.in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested herew ork); 203 \ | | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 17 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx90a. 21 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx1100. 21 warnings generated when compiling for gfx90a. 21 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx1200. 21 warnings generated when compiling for gfx90a. 21 warnings generated when compiling for gfx90a. [ 59%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_bf8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_bf8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_bf8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_bf8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp [ 59%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ 17 warnings generated when compiling for gfx1201. 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ : /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ 17 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ :222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ 17 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ [ 60%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ [ 60%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFdOp, ProtoLL128, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ INE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncPreMulSum, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncPreMulSum, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ NROLL>().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown29,: Cwarning: OLfield 'group' will be initialized after field 'stepSize' [-Wreorder-ctor]L _UNROLL>(args); | ^ 504 | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.ht:i203d:(66:t inote: din instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here) , nthreads( n203t | h r e a d s ) , RwuindW(otrikdE%lWeAmRePn_tS().r u505n | ( w e ) ;w a r| p ^I nBlock(threadIdx./builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cppx:/7W:A1R:P _note: Sin instantiation of member function 'RunWork, 0, 2, 2>::run' requested hereI ZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 7 | D E506F | I N E _ nfclcalgDTehvrFeuandc(((AtlildR%e4d)u=c=e3_)T,R EgEr_oSuIpM(PgLrEo_uPpr)e,M u l| S ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~u m _| f warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==31 6, ncclFuncAl l507R | e d u c es,t eFpuSniczPer(enMcucllSSuhmm,e mh.aclofm,m .NbCuCfLf_SAiLzGeOs_[TNRCECEL,_ PNRCOCTLO__PLRLO1T2O8_]S/INMCPCLLE_)S T E| P^S /sizeof(ui/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hn:t4066:452_:t )note: )expanded from macro 'DEFINE_ncclDevFunc' { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group 406 | RunWork9,: al gnote: o, proto, 2>().run(in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncc l503S | h m e m . c o m mp.rbiumfsf(Stiizde-sn[tNhCrCeLa_dPsRSOpTlOi_tS,I MnPtLhEr]e/aNdCsC-Ln_tShTrEePaSd/ssSipzleiotf,( T&)t r:e es-t>euppS,i zter_e)e -{> d o| w ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~n , | a group(groupr gs->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h | : 1065 : 5 : note: Pin instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncPreMulSum, ProtoLL128, 2>' requested herer imitivesL,L _/U*NDRiOrLeLc>t(=a*r/g0s,) ;P r o| t ^o , 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hnote: :in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here203 :66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 565 | r203u | n T r e e U p D oRuwnnWN,R OCLOLL>L(_)U.NrRuOnL(Lw>e()a;r g s| ) ^ ; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:5:1: note: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hin instantiation of member function 'RunWork, 0, 1, 2>::run' requested here: 203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 5203 | | D E F I N E _ n cRcunWloDervkFEulnce(mAenltlnc(A)l.rulnR(ewdeu)c; e| , ^ FuncPreMulS/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cppum:,7 :1h: anote: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested herel f, NCCL_ALG O7_T | RDEEEF,I NEN_nCcCLc_PlDReOvTFuOnc(A_LlLl1R2e8d)uce _ T| REE^_S IMPLE_Pr/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.heM:u406l:Su52m_:f16 ,note: expanded from macro 'DEFINE_ncclDevFunc'n cclFuncA ll406R | edu ce , FRuunncPWork, aNlCgoCL_,ALG Opr_otTRoEE,, N2C>C().runL_P(R&OTnOcc_lSISMPhLmEe) m | .^w ork); \/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h | ^ :409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncPreMulSum, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncPreMulSum, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*DIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ irect=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncPreMulSum, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMultShreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ um, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15:/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), grouIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ p(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(In file included from we);/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp : 1| : ^In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cppIn file included from :/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h7::141: :In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.hnote: :in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here37 : In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 7 | DEFINE_ncclDevFunc( A46l | lsRteadtuicce _lToRnEgE _lSoIgM2PiL(El_oPnrge Mnu)l S{u m _| f ^~~~~1 6, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElemIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ent().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDIn file included from e/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ vFunc(AllReduce_TREE_LL128_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem./builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hcomm.:buf222fS:i19z:es [warning: Nunused variable 'size' [-Wunused-variable]CC L_PROTO_LL128]/NCCL_ ST222E | P S/ s i zecofo(nuisntt6 4s_ts)i)z {e _ | t ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | s group(groupi ze = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlocIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ k(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitivesd),, nt/hre*adDs(intrhreeacdst),= t*id/In0Bl,ock (tPhrreaodItdxo.x,), g0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) r o| up^(g r/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.houp), | : ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ 409 | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_: 52:668 | note: expanded from macro 'DEFINE_ncclDevFunc' s tepSiz409e(s | te pS iz e_ =R= u0 n? WncoclrShkmeCL,_S TEaPSl/sgizeoof,(T ) p: rstoeptSioze,_) {4 >| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~( )| group(group. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hrun(&:n252:c90:c note: lin instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here S h252 | m e m .Prwimoitrives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIk); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(thrMePLaE_dPrIeMdulxSu.m_xf3)2,, n ccglFruncoAlulRped(ucge,r FounucPpre)Mu,lSu m , | fl ^~~~~~~~~~~oa t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(gro | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | Rup), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ unWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32, ncclFuncAllRe ^du ce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMP/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cppL:E)7 :| ^1 : note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | 7 | D ERFuInNWEo_rnkc_,T RaElEg_oS,I MpPrLoEt_oP,r e2M>u(l)S.urmu_nf(3&2n,c cnlcSchlmFeumn.cwAolrlkR)e;d u\c e ,| ^F uncPreMulSum, fl/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.ho:a667t:,15 :N Cnote: Cfield 'nthreads' will be initialized after field 'tidInBlock'L _ALGO_TREE, N C667C | L _ P R OtTiOd_(StIiMdP)L,E )n t h| r^e ads(nthreads), /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.ht:i409d:I52n:B lnote: oexpanded from macro 'DEFINE_ncclDevFunc'c k(threadIdx. x409) | , g r oRuupn(Wgorrokufield 'group' will be initialized after field 'stepSize', algo, proto ,667 | 4 > ( ) .triudn((t&indc)c,l Snhtmherme.awdosr(kn)t;h r\e a d| s ^) , tidInBlock(thre/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.ha:d667I:d15x:. xnote: )field 'nthreads' will be initialized after field 'tidInBlock', group(group), 667| | ^~~~~~~~~~~ tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f32, ncclFuncAllRedIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ uce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ >().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInB/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | lock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMP== 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ o, Proto, COLL_UNROLL>().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives,/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllRe/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ duce_RING_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_U N667R | OL L > ( atrigds()t;i d )| , ^ nthreads(nthreads), tid/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hI:n203B:l66o:c knote: (in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested heret hreadIdx.x), 203g | r o u p ( g r o uRpu)n,W o r| k ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~E l e| m tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_e nt (=)=. r0u ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: n(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFI 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ NE_ncclDevFunc(AllReduce_/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElemenRING_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ t().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 17 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TRE/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ E, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667In file included from | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp : 1 : tIn file included from i/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hd:(17: tIn file included from i/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.hd:11): ,In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h :12n: tIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.hh:126r: eIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.ha:d14s: In file included from (/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.hn:37t: hIn file included from r/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.hea:d14: s), ti/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.hd:I46n:Bl13o:c kwarning: (unused function 'log2i' [-Wunused-function] thread I46d | xs.txat)i,c lgonrgo ulog2i(long p(group), | ^~~~~~~~~~~ n) { | ^~~~~ UNROLL>().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 17 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1201. 21 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1200. 21 warnings generated when compiling for gfx90a. [ 60%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx1102. [ 60%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_u32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_u32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flaIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ g2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), groupIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ (group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) {In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ dop, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t d/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ata1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | con/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ st ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), t/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ idInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllRe17 warnings generated when compiling for host. duce_RING_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSu/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ m, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u32, nccl Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ FuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1200. 21 warnings generated when compiling for gfx90a. 21 warnings generated when compiling for gfx90a. 21 warnings generated when compiling for gfx90a. 21 warnings generated when compiling for gfx90a. [ 61%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_u64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_u64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp [ 61%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_u8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_u8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp 21 warnings generated when compiling for gfx90a. 21 warnings generated when compiling for gfx90a. [ 61%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_bf16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_bf16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_bf16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_bf16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: ulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadId/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ idInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreadIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ s(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565 10 | DEFINE_ncclDevFunc(AllReduce_RIN:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h :r667u:n15T:r ewarning: eUinitializer order does not match the declaration order [-Wreorder-ctor]p Downn,t hCrOeLaLd_sU(NnRtOhLrLe>a(dasr)g,s )t;i d I| n ^B lock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h| : tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_203 :66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 668 | 203 | s t e p S i zReu(nsWtoerpkSEilzeem_e n=t=< F0n ,? Tn,c cRleSdhOmpe,m A.lcgoom,m .PbruoftfoS,i zCeOsL[LN_CUCNLR_OLPLRO>T(O)_S.rIun(MPweL);E ]| ^/ NCCL_STEP/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cppS:/7:s1:i note: zin instantiation of member function 'RunWork, 0, 2, 2>::run' requested here eof(T) : st 7e | pDSEFiINzeE__) nccl{D e| v ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~F u n| c(A group(groupl lReduce_TREE_SIMP/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hLE:301:90_:P rnote: eMin instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested hereulSu m_u8, ncclF 301u | n c A ll RPriedumcie, tFiuvnecsPrM,PL E/)*D ir| ec^t =*/0, Proto/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h,: 406:052>: pnote: rexpanded from macro 'DEFINE_ncclDevFunc' ims | ^406 | RunWor/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hk:<565:co5ll:, ty, note: rin instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested heree dop, a565l | g o, rpruontoT,r 2>e(e)U.rpuDno(w&nnccl, C OL667 | L_ U NR OL L>(tarigds(t)i;d )| ^, nthreads(nthre/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hads:203):66,: tnote: iin instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested heredInBl ock(thr e203a | dI dx .x) , gRrunWorkoEluemepn(tgi(d)),. ntrhurne(awde);s( n t| h ^re ads), tidIn/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cppBl:o7c:k(1t:h note: rin instantiation of member function 'RunWork, 0, 2, 2>::run' requested heree adIdx.x), g7r | oDuEpF(gIroNuEp_)n,c cl De| v ^~~~~~~~~~~ Func(AllReduce_TREE_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_tG_LL128_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ , NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ metric<1, NCCL_MAX_DEV_ARITY>, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ MPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ dop, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ roto, COLL_UNROLL>().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitivescount; | ^~~~ , FanAsymmetric<1, NCCL_MAX_DEV_ARITY>, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ INE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), gr/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ oup(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(thre/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ adIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 28, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ Down, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group( 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ 17 warnings generated when compiling for host. group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 17 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSifield 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ zes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidI 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ nBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ ((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ Sum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nt/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), hreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffIn file included from Sizes[/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cppN:CC2L_: PRIn file included from O/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hT:O_10S: IMIn file included from PL/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.hE:]/169N: CCL/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h_S:TE270P:S19/:si zewarning: ofunused variable 'ptr' [-Wunused-variable]( T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group 270 | uint64_t* ptr = re/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hc:v62:P56t:r (note: 0in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here) +ll128Of f62s | e t ;P ri m| it ^~~iv es, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(th/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hreadId:x.667x:)15, :g rwarning: ouinitializer order does not match the declaration order [-Wreorder-ctor]p( group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667667 | | t id (ttiidd),( tntihdre)a,ds (nntthhrreaedasd),s t(indItnhBlroecka(dtsh)re,a dItdix.dx)I,n Bgrlooupc(kgr(otuhpr),e a | ^~~~~~~~~~~ dIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1201. 21 warnings generated when compiling for gfx90a. 21 warnings generated when compiling for gfx90a. [ 61%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_bf8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_bf8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_bf8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_bf8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssizIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ e_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCC8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ L_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepS/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(groupize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 17 warnings generated when compiling for host. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1201. 21 warnings generated when compiling for gfx90a. 21 warnings generated when compiling for gfx90a. 21 warnings generated when compiling for gfx90a. [ 62%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp 21 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 17 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ 17 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ 17 warnings generated when compiling for gfx1200. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncProd<__half>, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncProd<__half>, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncProd<__half>, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16,In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | ru/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | nRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> p/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ rims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncProd<__half>, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncProd<__half>, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncProd<__half>, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ 17 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1101. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx90a. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ [ 62%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp 21 warnings generated when compiling for gfx90a. 21 warnings generated when compiling for gfx90a. [ 62%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ :2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: 10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ : warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tric<1, NCCL_MAX_DEV_ARITY>, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tidDEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ em.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NC/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x),CL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | 17 ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ warnings generated when compiling for host. | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ :667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ : /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCC/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | L_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h21 warnings generated when compiling for gfx90a. :667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ 17 warnings generated when compiling for gfx1100. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ c(AllReduce_TREE_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1101. [ 63%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.wo/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclSh/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFuIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(mem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncnc(AllReduce_TREE_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ clDevFunc(AllReduce_RING_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1200. 21 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1101. 21 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx1201. 21 warnings generated when compiling for gfx90a. [ 63%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_u32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_u32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp 21 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx1201. [ 63%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_u64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_u64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ :222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffse/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ t / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ [ 63%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_u8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_u8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ : warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args)/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 21 warnings generated when compiling for gfx90a. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreadIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | s), tidInBlock(t hr e a d IRudnxW.oxr)k,E lgermoeunpt(( )667. | r u n ( wtei)d;( ti d| ) ^, nthreads(nthreads), tidInBlock(threadIdx.x), /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cppg:ro7u:p1(:g rnote: oin instantiation of member function 'RunWork, 0, 2, 2>::run' requested hereu p), | ^~~~~~~~~~~ 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u32, ncclFunc/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ LE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 17 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ [ 64%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_bf16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_bf16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_bf16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_bf16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cppn:1: In file included from c/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.hc:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76l:18: warning: unused variable 'y' [-Wunused-variable] S76 | h umint32_et y, hmead, m.antissacomm.buffS;i | ^z es[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ 17 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*DirIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ ect=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1201. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ CCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ :15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Symmetric<1>, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdxIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ .x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), gIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ roup(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 17 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_S17 warnings generated when compiling for gfx1102. TEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ ims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), gr/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0oup(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | s/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.ht:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ epSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthread/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hs:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here (nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ [ 64%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_bf8.cpp.o In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_bf8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_bf8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_bf8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | fl:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ agThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ In file included from | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ :222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement()In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ .run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h);: 667 :| 15 ^: warning: initializer order does not match the declaration order [-Wreorder-ctor] /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203667 | | t i d (RtuindW)o,r knEtlhermeeandts<(Fnnt,h rTe,a dRse)d,O pt,i dAIlngBol,o cPkr(otthor,e aCdOILdLx_.UxN)R,O LgLr>o(u)p.(rgurno(uwpe)),; | | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ ^ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp: 7668 | : 1 : note: sin instantiation of member function 'RunWork, 0, 2, 4>::run' requested heret epSize(stepSize_ = =7 | 0D E?F InNcEcl_SnhcmcelmD.ecvoFmumn.cb(uAflflSiRzeedsu[cNeC_CTLR_EPER_OSTIOM_PSLIEM_PSLuEm]_/bNfC1C6L,_ SnTcEcPSl/FsuinzceAolflRedu(ceT,) F:u nsctSeupmS,i zhei_p)_ b{f l o| a ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~t 1 6| , group(group NCCL_ALGO_TREE, NCCL_PROTO_SI/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hMP:L252E:)90 : | note: ^in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h252 | : 409 : 52 : note: Pexpanded from macro 'DEFINE_ncclDevFunc'r imitives_,A RaIlTgYo,, 1p>r,o t/o*,D i4r>e(c)t.=r*u/n0(,& nPcrcoltSoh,m e0m>. wporrikm)s; \| ^ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h::565667::515:: note: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested herefield 'nthreads' will be initialized after field 'tidInBlock' 565 | 667 | r utniTdr(eetUipdD)o,w nnx,. xC)O,L Lg_rUoNRuOpL(Lg>r(oaurpg)s,); | | ^~~~~~~~~~~~~~~~~ ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h667: | 203 : 66 : tnote: iin instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested hered (tid), nthr e203a | d s ( n t h r e aRdusn)W,o rtkiEdlIenmBelnotc().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ clDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Dire/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 17 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1101. 21 warnings generated when compiling for gfx90a. 21 warnings generated when compiling for gfx90a. [ 64%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp 21 warnings generated when compiling for gfx90a. 21 warnings generated when compiling for gfx90a. 21 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx1101. 21 warnings generated when compiling for gfx90a. [ 64%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 17 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 17 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 17 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncSum<__half>, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncSum<__half>, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncSum<__half>, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncSum<__half>, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ m.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncSum<__half>, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncSum<__half>, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthrereads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ flagThread(/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ (tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h&:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCncclShmem.work); \ | ^ CL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , redop, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc'/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h :667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 409 | RunWork667, | a l g o ,t ipdr(ottiod,) ,4 >n(t)h.rreuand(s&(nnctchlrSehamdesm).,w otrikd)I;n B\l o c| k ^( threadIdx.x),/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h :g667r:o15u:p (note: gfield 'nthreads' will be initialized after field 'tidInBlock'r oup), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_667 | tid(tid), n t668h | r e a d ss(tnetphSriezaed(ss)t,e ptSiidzIen_B l=o=c k0( t?h rnecacdlISdhxm.exm).,c ogmrmo.ubpu(fgrfoSuipz)e,s [ N| C ^~~~~~~~~~~~~~~~~C L_PRO/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hT:O667_:S60I:M Pnote: Lfield 'group' will be initialized after field 'stepSize'E ]/NCCL_STEP S667/ | s i ze o ft(iTd)( t:i ds)t,e pnStihzree_a)d s{( n t| h ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~r e a| d group(groups ), tidInBlo/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ck(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 21 warnings generated when compiling for gfx90a. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / chanIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:n19elCount; | ^~~ : warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ _ARITY, 1>, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 21 warnings generated when compiling for gfx90a. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nth 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ reads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buf/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ fSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ [ 65%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h667:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f32, ncclFuncAllR/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ educe, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthr/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ eads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(t/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ hreadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCIn file included from CL_/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cppA:L1G: OIn file included from _/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hR:I17: NIn file included from G/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h,:11 : In file included from N/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:C12: CIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.hL:126_: In file included from P/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.hR:14O: TIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.hO:37_: SIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.hI:14M: P/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.hL:E46):13 : warning: | ^unused function 'log2i' [-Wunused-function] /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 46 | st a409ti | c l on g lRogu2ni(Wloonrg kn<) c{o l| l ^~~~~ , ty, redop, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 17 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 21 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffse/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2t: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h :10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:/168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h: 140:14: cwarning: unused variable 'data1' [-Wunused-variable] h140a | n uinnt32_te datla1, Cflago1, duata2,n flag2; | ^~~~~ t/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140;:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | | u ^~~int3 2_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ 17 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1102. [ 65%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ (tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 21 warnings generated when compiling for gfx90a. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().rIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ un(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE)/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ [ 65%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_u32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_u32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreadIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: \In file included from | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ s(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ : note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ :370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | PrimitiIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ves, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&n/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ cclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uintIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), gr/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_Roup(group), | ^~~~~~~~~~~ In file included from ING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hPrimitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElementIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Op, FanSymmetric<1>, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(ntIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ hreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, alg/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] o, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tid/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ InBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidI/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ nBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx90a. 21 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx1102. 21 warnings generated when compiling for gfx90a. 21 warnings generated when compiling for gfx90a. 21 warnings generated when compiling for gfx90a. 21 warnings generated when compiling for gfx90a. [ 65%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_u64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_u64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp [ 66%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_u8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_u8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ :222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ :370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ [ 66%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threa:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' dIdx.x), group(group), | ^~~~~~~~~~~ 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ _UNROLL>, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(grIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ oup), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ty, redop, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ um, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement()/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ .run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 21 warnings generated when compiling for gfx90a. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllRedu/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ ce_RING_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ [ 66%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), gr/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ oup(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx./builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo,x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 17 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 17 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads),In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ duce_TREE_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here :667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 12 | DEFINE_ncclDevFunc(AllReduce_RIN G667_ | S I M P LtEi_dS(utmiPdo)s,t Dnitvh_rie3a2d,s (nnctchlrFeuandcsA)l,l RteidduIcneB,l oFcukn(ctShurmePaodsItdDxi.vx,) ,i ngtr3o2u_pt(,g rNoCuCpL)_,A L G| O ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~_ R I| N tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_G , NCCL_PROTO_SI M668P | L E ) s| t^e pSize(stepSize_ == 0 ?/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h n:c406c:l52S:h mnote: eexpanded from macro 'DEFINE_ncclDevFunc'm .comm.buffSize s406[ | N C C L _RPuRnOWToOr_kSi,z eaolfg(oT,) p:r osttoe,p S2i>z(e)_.)r u{n ( &| n ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~c c l| S group(grouph mem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h::15252:: 90note: :field 'nthreads' will be initialized after field 'tidInBlock' note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 667 | 252 | t i d ( tPirdi)m,i tnitvherseg,r o/u*pD)i,r e c| t ^~~~~~~~~~~~~~~~~= */0, /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hP:r667o:t60o:, note: 0field 'group' will be initialized after field 'stepSize'> prims | ^ 667 | tid/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h(:t565i:d5):, note: nin instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested heret hreads(nthre a565d | s ) , triudnITnrBeleoUcpkD(otwhnr, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ MPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ L_UNROLL>, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 21 warnings generated when compiling for gfx90a. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkEle/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hment().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64, ncclFu17 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMIn file included from PLE]//builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cppN:CC2L: _In file included from S/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hT:E10P: SIn file included from //builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.hs:i168z: eo/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.hf:(140T:)14 :: warning: sunused variable 'data1' [-Wunused-variable]t epSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h301::90140:: 21note: :in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here warning: unused variable 'flag1' [-Wunused-variable] 140 | 301 | u i n t 3P2r_itm idtaitveas1<,T ,f lRaegd1O,p ,d aFtaan2A,s yfmlmeatgr2i;c < 1| , ^~~~~ NCCL/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h_:M140A:X28_:D Ewarning: Vunused variable 'data2' [-Wunused-variable]_ ARITY>, /140* | D i r e cuti=n*t/302,_ tP rdoattoa,1 ,0 >f lpargi1m,s d a| t ^a 2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h::5140:: 35note: :in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here warning: unused variable 'flag2' [-Wunused-variable] 140 | 565 | u irnutn3T2r_ete UdpaDtoaw1n,< Tf,l aRge1d,O pd,a tPar2o,t ofSliamgp2l;e < 1| ^~~~~, 1, COLL_UNROLL>, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = argIn file included from s/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ ->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t*In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ :15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSiIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ ze_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ 409 | RunWork, algo, proto, 4>().run(&ncclShmIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ em.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, da/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | ttid(ati2d),, nftlhraega2d;s( nt h| r ^~~~~e ads), tidInBlock(threadIdx.x), gro/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.hup:(g140r:o35u:p )warning: ,unused variable 'flag2' [-Wunused-variable] | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: 140field 'group' will be initialized after field 'stepSize' | uint32_ t667 | d a t a 1t,i df(ltaigd1),, dnatthar2e,a dfsl(angt2h;r e a| d ^~~~~s ), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SuIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ mPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ Block(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ [ 66%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(gro/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ up), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives , /*Direct=*/0, Proto, 0> prims | ^ 667 | tid(ti/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hd:565):5,: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested heren threads(nth r565e | a d s r)u,nT rteeiUdpDIonwBn,p )C,OL L _U| NR ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~O LL >| ( tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ar gs); | ^ 668 | step/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hS:203i:z66e: (note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested heres tepSize_ = =203 | 0 ? RnucncWolrkSEhlemmeenmt.I(M).PrLuEn(]w/e)N;C C| L ^ _STEPS/sizeo/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cppf:7(:1T:) note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here: stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | 7 group(group | D EFINE_ncclDevFunc(AllReduce_TREE_S/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hIM:P301LE:_S90u:mP osnote: tDin instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested herei v_i64, ncclFuncA ll301Re | d uc e, F u ncPSrumiPmositDtiiv,v ienst6<4T_t,, RNCeCLd_AOLpG,O _TFREaEn,A NsCyCLm_PmReOTtOr_SiIcMexpanded from macro 'DEFINE_ncclDevFunc' , /*Direct=* /406 | 0 , RPurnWoortkt y,p rreidmop| , ^a lgo, pro/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hto:565,: 52:> (note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ).run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown,In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SI/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ MPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1100. 21 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1101. 21 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx1100. 21 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1200. 21 warnings generated when compiling for gfx90a. [ 67%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1201. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 17 warnings generated when compiling for gfx1101. 21 warnings generated when compiling for gfx90a. 21 warnings generated when compiling for gfx90a. [ 67%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 50321 warnings generated when compiling for gfx90a. | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32, ncIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ clFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SI/M*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ PLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ [ 67%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp.o 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, P/usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlocroto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ k(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head21 warnings generated when compiling for gfx90a. , mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ [ 67%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/alltoall_pivot_sum_i8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/alltoall_pivot_sum_i8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/alltoall_pivot_sum_i8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/alltoall_pivot_sum_i8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h :667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); 17\ warning s generated| ^ when compiling for gfx1102. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 17 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 17 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1201. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 17 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we);In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ [ 68%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/broadcast_sum_i8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/broadcast_sum_i8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/broadcast_sum_i8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/broadcast_sum_i8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STE/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ PS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tid/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidIInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ nBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostD:i667:15:v warning: initializer order does not match the declaration order [-Wreorder-ctor], 667 | u itid(tnid),t nth6read4s(nth_readts), ,tidI nBloNck(tChreaCdIdLx.x)_, grAoup(LgroupG), O| ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ _| tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ R668I | N G, NCCL_PROTstepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWoOr_SkIMPLEE) l| ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.he:m406:52:e note: expanded from macro 'DEFINE_ncclDevFunc' n 406 | t R, a lgo,R proeto, d2>()O.runp(&ncc,lS hmemA.worlk); \g | o ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h,:667 :15: Pnote: field 'nthreads' will be initialized after field 'tidInBlock' r667 | o ttid(otid),, nth reaCds(ntOhreaLds),L tidI_nBloUck(tNhreaRdIdxO.x),L grouLp(gr>oup)(, )| ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h.:667:r60: note: field 'group' will be initialized after field 'stepSize'u n667 | ( tiwd(tied), n)thre;ads( nth reads| ), t ^idIn B/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpplock(threadIdx.x), gro:up(gr7oup):, 1| ^~~~~~~~~~~ : note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RuIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ nWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ Idx.x), In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSiIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ zes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 17 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u64, /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ IMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), groupIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ (group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:35:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 35 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 80 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(AllToAllPivot_RING_SIMPLE_Sum_i8, ncclFuncAllToAllPivot, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:35:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 35 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 80 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(AllToAllPivot_RING_SIMPLE_Sum_i8, ncclFuncAllToAllPivot, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ NROLL>, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:35:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 35 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 80 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 3 | DEFINE_ncclDevFunc(AllToAllPivot_RING_SIMPLE_Sum_i8, ncclFuncAllToAllPivot, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.hinitializer order does not match the declaration order [-Wreorder-ctor]: 35:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 35 | Primitive s667< | T , R etdiOdp(,t iFda)n,S ynmtmherteraidcs<(1n>t,h r0e,a dPsr)o,t ot,i d0I>n Bplroicmks( t h| r ^e adIdx.x), group/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h(:g80r:o5u:p )note: ,in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 80 | runRing=( a0r g?s )n;c c l| S ^h mem.comm.buffSizes[NCCL_PROTO_/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hS:I203M:P66L:E ]note: /in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested hereN CCL_STEPS/si z203e | o f ( T ) : sRtuenpWSoirzkeE_l)e m{e n t| < ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~F n ,| group(groupT , RedOp, Algo, Proto, COLL_UNROLL>().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:35:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 35 | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp : 3 :P1r:i mnote: iin instantiation of member function 'RunWork, 1, 2, 2>::run' requested heret ivesc,l D0e,v FPurnoct(oA,l l0T>o AplrliPmisv o t| _ ^R ING_SI/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here M 80P | L E _ S urmu_niR8i,n gn,( airngts8)_;t , | N ^C CL_ALGO_RING, NCCL_P/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hR:O203T:O66_:S Inote: Min instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested hereP LE) | ^ 203 | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h : 406 :R52u:n Wnote: oexpanded from macro 'DEFINE_ncclDevFunc'r kElementR,O LaLl>g(o),. rpurno(twoe,) ;2 > (| ) ^. run(&ncclSh/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cppm:e3m:.1w:o rnote: kin instantiation of member function 'RunWork, 1, 2, 2>::run' requested here) ; \ | ^ 3 | DEF/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hI:N667E:_15n:c cnote: lfield 'nthreads' will be initialized after field 'tidInBlock'D evFunc(AllToA l667l | P i v o tt_iRdI(NtGi_dS)I,M PnLtEh_rSeuamd_si(8n,t hnrcecaldFsu)n,c AtlildTIonABllloPcikv(otth,r eFaudnIcdSxu.mx,) ,i ngtr8o_utp,( gNrCoCuLp_)A,L G O| _ ^~~~~~~~~~~~~~~~~R ING, N/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hC:C667L:_60P:R Onote: Tfield 'group' will be initialized after field 'stepSize'O _SIMPLE) | ^ 667 | ti/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hd(:t406i:d52):, note: expanded from macro 'DEFINE_ncclDevFunc'n threads(nthr e406a | d s ) , RtuindWIonrBklr,o uapl(ggor,o uppr)o,t o | , ^~~~~~~~~~~ 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:35:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 35 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 80 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 3 | DEFINE_ncclDevFunc(AllToAllPivot_RING_SIMPLE_Sum_i8, ncclFuncAllToAllPivot, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:35:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 35 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 80 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(AllToAllPivot_RING_SIMPLE_Sum_i8, ncclFuncAllToAllPivot, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:35:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 35 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 80 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 3 | DEFINE_ncclDevFunc(AllToAllPivot_RING_SIMPLE_Sum_i8, ncclFuncAllToAllPivot, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:35:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 35 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 80 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 3 | DEFINE_ncclDevFunc(AllToAllPivot_RING_SIMPLE_Sum_i8, ncclFuncAllToAllPivot, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:35:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 35 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 80 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(AllToAllPivot_RING_SIMPLE_Sum_i8, ncclFuncAllToAllPivot, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:35:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 35 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 80 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 3 | DEFINE_ncclDevFunc(AllToAllPivot_RING_SIMPLE_Sum_i8, ncclFuncAllToAllPivot, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, PIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:421:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 421 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ roto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t,In file included from NC/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cppC:L2_: AIn file included from L/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hG:O10_: RIn file included from I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.hN:G169,: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.hNC:C506L:_29P:R Owarning: Tfield 'group' will be initialized after field 'stepSize' [-Wreorder-ctor]O _SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc'504 | tid(t i406d | ) , n tRhurneWaodrsk(W,A RaPl_gSoI,Z Ep)r,o twoa,r p2(>t(i)d./rWuAnR(P&_nScIcZlES)h,m e m| . ~~~~~~~~~~~~~~~~~~w o r| k stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) ; \ | ^ 505 | warpInBloc/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hk:(667t:h15r:e anote: dfield 'nthreads' will be initialized after field 'tidInBlock'I dx.x/WARP_SIZE), 667 | | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | t warp(tid/WARP_SIZEi d(tid), n506t | h r e a dfsl(angtThhrreeaadds()(,t itdi%d4I)n=B=l3o)c,k (gtrhoruepa(dgIrdoxu.px)),, g| r ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~o u p| ( warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 group), | ^~~~~~~~~~~~~~~~~ 507 | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h : 667s:t60e:p Snote: ifield 'group' will be initialized after field 'stepSize'z e(ncclShmem .667c | o m m . btuifdf(Stiizde)s,[ NnCtChLr_ePaRdOsT(On_tLhLr1e2a8d]s/)N,C CtLi_dSITnEBPlSo/cski(ztehorfe(audiIndtx6.4x_)t,) )g r{o u p| ( ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~g r o| u group(groupp ), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:461:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 461 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:503:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 503 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1065:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128, 2>' requested here 1065 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tid:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), InBlnock(threatdIdx.x), grhoup(grourp), | ^~~~~~~~~~~ eads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:35:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 35 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 80 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 3 | DEFINE_ncclDevFunc(AllToAllPivot_RING_SIMPLE_Sum_i8, ncclFuncAllToAllPivot, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:35:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 35 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 80 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(AllToAllPivot_RING_SIMPLE_Sum_i8, ncclFuncAllToAllPivot, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here :667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSi 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ zes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:35:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 35 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 80 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(AllToAllPivot_RING_SIMPLE_Sum_i8, ncclFuncAllToAllPivot, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:35:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 35 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 80 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 3 | DEFINE_ncclDevFunc(AllToAllPivot_RING_SIMPLE_Sum_i8, ncclFuncAllToAllPivot, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:35:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 35 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 80 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 3 | DEFINE_ncclDevFunc(AllToAllPivot_RIIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ NG_SIMPLE_Sum_i8, ncclFuncAllToAllPivot, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:1057:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 1057 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:58:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 58 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:95:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 95 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Broadcast_RING_SIMPLE_Sum_i8, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:58:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 58 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:109:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 109 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Broadcast_RING_LL128_Sum_i8, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:58:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 58 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:95:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 95 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Broadcast_RING_SIMPLE_Sum_i8, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:58:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 58 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:95:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 95 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Broadcast_RING_SIMPLE_Sum_i8, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:58:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 58 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:95:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 95 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Broadcast_RING_SIMPLE_Sum_i8, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:58:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 58 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:95:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 95 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Broadcast_RING_SIMPLE_Sum_i8, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:58:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 58 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:109:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 109 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Broadcast_RING_LL128_Sum_i8, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:58:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 58 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:95:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 95 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Broadcast_RING_SIMPLE_Sum_i8, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:58:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 58 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:95:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 95 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Broadcast_RING_SIMPLE_Sum_i8, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:58:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 58 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:95:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 95 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Broadcast_RING_SIMPLE_Sum_i8, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:58:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 58 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:95:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 95 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Broadcast_RING_SIMPLE_Sum_i8, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:58:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 58 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:95:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 95 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Broadcast_RING_SIMPLE_Sum_i8, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:58:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 58 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:95:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 95 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Broadcast_RING_SIMPLE_Sum_i8, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 17 warnings generated when compiling for gfx1201. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:58:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 58 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:95:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 95 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Broadcast_RING_SIMPLE_Sum_i8, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:58:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 58 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:95:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 95 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Broadcast_RING_SIMPLE_Sum_i8, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:58:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 58 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:95:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 95 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Broadcast_RING_SIMPLE_Sum_i8, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:58:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 58 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:95:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 95 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Broadcast_RING_SIMPLE_Sum_i8, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SI17 warnings generated when compiling for gfx1100. MPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 17 warnings generated when compiling for gfx1102. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:58:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 58 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:95:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 95 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Broadcast_RING_SIMPLE_Sum_i8, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 17 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1102. 21 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx90a. 21 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1200. [ 68%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/device_table.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/device_table.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/device_table.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/device_table.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/device_table.cpp [ 68%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/host_table.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/host_table.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/host_table.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/host_table.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/host_table.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/host_table.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/host_table.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/device_table.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/host_table.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/device_table.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/host_table.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/device_table.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/host_table.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/device_table.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/device_table.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/host_table.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/host_table.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/device_table.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/device_table.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/host_table.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/device_table.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 1 warning generated when compiling for host. 9 warnings generated when compiling for gfx1101. 1 warning generated when compiling for host. 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1102. 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx1102. 1 warning generated when compiling for gfx1101. 1 warning generated when compiling for gfx1100. 1 warning generated when compiling for gfx1200. 1 warning generated when compiling for gfx1201. 1 warning generated when compiling for gfx1102. 1 warning generated when compiling for gfx1201. 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx1200. 1 warning generated when compiling for gfx1101. 1 warning generated when compiling for gfx1100. 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1100. [ 68%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp [ 69%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx90a. [ 69%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp 17 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | In file included from uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1200. 17 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 17 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 17 warnings generated when compiling for gfx1102. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | fl/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ agThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 17 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1201. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:4089 warnings generated when compiling for host. :3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ 17 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx90a. 21 warnings generated when compiling for gfx90a. [ 69%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp 21 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1102. 21 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1100. [ 69%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for gfx90a. [ 70%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx90a. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ [ 70%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_i32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_i32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_i32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_i32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 17 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 17 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ [ 70%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_i64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_i64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_i64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_i64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), war/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARPp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ _SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PRIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x)OTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ , group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ CESTEPS, MSCCL_SLICESTEPS, 2>, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1100. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 21 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 9 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx90a. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[9N warnings generated when compiling for gfx1101. CCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ [ 70%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_i8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_i8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_i8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_i8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), 9 warnings generated when compiling for gfx90a. | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ [ 71%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_u32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_u32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx90a. [ 71%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_u64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_u64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ : warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 9 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 9 warnings generated when compiling for gfx1201. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.com/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: m.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:149 warnings generated when compiling for gfx1100. : /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1101. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(99 warnings generated when compiling for gfx90a. warnings generated when compiling for gfx1102. group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ [ 71%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_u8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_u8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1200. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ [ 71%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_bf16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_bf16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_bf16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_bf16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ [ 72%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_bf8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_bf8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_bf8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_bf8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable]In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | In file included from uint/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp3:21_: tIn file included from d/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.ha:t13a: 1In file included from ,/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h :f168l: a/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.hg1:,140 :d14a:t awarning: 2unused variable 'data1' [-Wunused-variable], flag2; | ^~~~~ 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 9 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 9 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ 9 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | PrimiIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx90a. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ 9 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreaat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ ds), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ [ 72%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for gfx1100. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1201. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx90a. [ 72%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp [ 72%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), n mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ threads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ 9 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 9 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable]In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tidIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ %WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ >, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WAR/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ P_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h: In file included from :/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:506167:: 29:/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h warning: :667field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor]: 15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 504 | t667i | d ( t i dt)i,d (nttihdr)e,a dnst(hnrtehardesa(dnst)h,r ewaidds()t,i dt%iWdAIRnPB_lSoIcZkE()t,h rweaardpI(dtxi.dx/)W,A RgPr_oSuIpZ(Eg)r,o u p| ) ~~~~~~~~~~~~~~~~~~, | | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 505 | war p668I | n B l o cskt(etphSriezaed(Isdtxe.pxS/iWzAeR_P _=S=I Z0E )?, n c| c ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~l S h| m warp(tid/WARP_SIZEe m.comm.bu f506f | S i z e sf[lNaCgCTLh_rPeRaOdT(O(_tSiIdM%P4L)E=]=/3N)C,C Lg_rSoTuEpP(Sg/rsoiuzpe)o,f ( T| ) ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ : | s warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3t epSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~507 | | group(group stepSize(ncclShmem.comm.buffSiz/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.he:s220[:N57C:C Lnote: _in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested hereP ROTO_LL128 ]220/ | N C CPLr_iSmTiEtPiSv/essi, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:: 3note: :in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here1 : note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 220 | 3P | rMiSmCiCtLi_vIesMP,_ T1Y,P EP(rPortood,, 0f>l oparti,m sf a l| s ^e ); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:3:/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h1::408 :note: 3in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 3 | MSCCL_IMPL _408K | E R NmEsLc_cElNRTuRnYI_nFtUeNrCp_rDeEtVeRrEs,e )P;r o t| o^S imple#,d efvurleldOopps<>t(ycpoem>m,, Parlogtoo,L Lw1o2r8k,) ;f u\l l O| p ^s >(comm, algo, w/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.ho:r667k:)15;: \note: field 'nthreads' will be initialized after field 'tidInBlock' | ^ 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ [ 73%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1100. [ 73%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_i32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_i32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_i32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_i32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx90a. [ 73%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_i64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_i64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_i64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_i64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2,[ 73%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_i8.cpp.o flag2; | ^~~~~ /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_i8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_i8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_i8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx90a. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ [ 74%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_u32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_u32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ [ 74%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_u64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_u64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ ; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.hIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ :506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:id), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | 168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | t 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ id(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.bu/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ ffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : s/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ tepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTOIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ _LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ ims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ 9 warnings generated when compiling for host. 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1200. [ 74%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_u8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_u8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1101. [ 75%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_bf16.cpp.o 9 warnings generated when compiling for gfx1102. /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_bf16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_bf16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_bf16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp 99 warnings generated when compiling for gfx1201. warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1101. [ 75%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_bf8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_bf8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_bf8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_bf8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1201. [ 75%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp 9 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for gfx1200. [ 75%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ [ 76%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ pe, Func##devredop, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreadsIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ (nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, In file included from f/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buflag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ fSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ : In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.com/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ m.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: In file included from note: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffS/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.hizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_:506:29: Fwarning: UNC_Dfield 'group' will be initialized after field 'stepSize' [-Wreorder-ctor]EVRED OP_T YPE(Sum, hip_bfloat16, fa504 | tid(lste); i| ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.hd:408), nthreads(nthreads), wi:d3: note: (expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' t408 | imsccldRunIn%terprWeteARP_SIZrE, ProtoSimple, fullOps>(comm, algo, woZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL12r8k); ]\ | / ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hN:667:15:C note: field 'nthreads' will be initialized after field 'tidInBlock'In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ C 667 | L tid(t_id), SnthreTads(nEthreaPds), StidI/nBlock(sthreaidIdzx.x), egroupo(groufp(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ ), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, hip_bfloat16, false); | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ : In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ ZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:3:1: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUnote: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ NC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBloIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ ck(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buf/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ fSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx90a. [ 76%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx90a. [ 76%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_i32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_i32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_i32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_i32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp 9 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1100. [ 76%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_i64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_i64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_i64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_i64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx90a. [ 77%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_i8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_i8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_i8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_i8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp 9 warnings generated when compiling for gfx90a. [ 77%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_u32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_u32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp 9 warnings generated when compiling for gfx90a. [ 77%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_u64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_u64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ : In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | In file included from ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h: :In file included from 667/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h::1514:: In file included from note: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hfield 'nthreads' will be initialized after field 'tidInBlock': 17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from 667/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h | : 126 : In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.ht:i14d: (In file included from t/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.hi:d37): ,In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.hn:t14h: re/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.had:s46(:n13t:h rwarning: eunused function 'log2i' [-Wunused-function]a ds), tidInBlock(threadIdx. x46) | ,s tgartoiucp (lgornogu pl)o,g 2 i| ( ^~~~~~~~~~~~~~~~~l ong n/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h): 667{: 60 :| ^~~~~note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ Interpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads)In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { , tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | PrimitIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? nIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ cclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx90a. [ 77%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_u8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_u8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1101. [ 78%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_bf16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_bf16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_bf16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_bf16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1100. [ 78%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_bf8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_bf8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_bf8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_bf8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx90a. [ 78%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp 9 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx90a. [ 78%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp [ 79%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uin/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagTht32_t y, head, mantissa; | ^ read((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ InBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_bf16, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf16, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf16, ncclFuncReduce, FuncMinIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf16, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Max, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf16, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf16, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_bf16, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf16, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf16, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf16, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf16, ncclFuncReduce, FuncMin/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here Max, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf16, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf16, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf16, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf16, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flaIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ g2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf16, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa;In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf16, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf16, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf8, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf8, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf8, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf8, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf8, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf8, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf8, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf8, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE),/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf8, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_bf8, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf8, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f16, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf8, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf8, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_bf8, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f16, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf8, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f16, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f16, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf8, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f16, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf8, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf8, ncclFuncReduce/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h,:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, a FuncMinMax, rccrgs->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f16, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ l_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f16, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f16, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next,In file included from arg/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpps:->1s: eIn file included from nd/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hb:u17f: fIn file included from ,/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h :a11r: gIn file included from s/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h-:>12r: eIn file included from c/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.hv:b126u: fIn file included from f/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h,: 14: aIn file included from r/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.hg:s37-: >In file included from r/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.he:d14O: pA/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.hr:g46,: 130:, warning: arunused function 'log2i' [-Wunused-function]g s->connIndex, args->conn I46n | dsetxa)t;i c | l ^o ng log2i(lon/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.hg: 63n:)5 :{ note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here | ^~~~~ 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f16, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f16, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warningIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ s generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_f16, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_f16, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f16, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f16, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f32, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f16, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f16, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f16, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f32, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f16, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f32, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_f32, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f32, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f32, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f64, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f64, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f32, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f32, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSizIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ e(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f64, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, argsIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f32, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_M9 warnings generated when compiling for host. inMax_f64, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f64, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f32, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f64, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f32, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_f64, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_f64, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_f32, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f64, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f64, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f64, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ evFunc(Reduce_RING_SIMPLE_MinMax_f64, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f64, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f32, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f32, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. :60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f32, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f64, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f64, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f64, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f64, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f64, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f32, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f32, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f32, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx90a. [ 79%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx90a. [ 79%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_u32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_u32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp [ 79%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_u64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_u64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx90a. [ 80%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_u8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_u8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp 10 warnings generated when compiling for gfx90a. [ 80%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_bf16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_bf16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_bf16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_bf16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f8, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_f8, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f8, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f8, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_f8, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f8, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f8, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f8, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f8, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f8, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f8, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f8, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.bufIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ fSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f8, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f8, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f8, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f8, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f8, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f8, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.hIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid)In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ , nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u64, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_u32, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u32, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u64, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u32, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u32, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u32, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u32, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u32, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u32, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_u32, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u64, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_u64, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u32, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u64, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u32, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u64, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u32, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u32, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u64, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u64, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u32, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u32, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u32, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u8, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u64, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u8, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_u64, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u64, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u32, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u64, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u64, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u8, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u64, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u32, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u64, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u8, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u8, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf16, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u8, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u8, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_bf16, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf16, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf16, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u64, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_bf16, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf16, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ _ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunW/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u8, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ork, algo, proto, 4>().run(&ncclShmem.worIn file included from k); \ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:| 2: In file included from ^/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10 : In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: :initializer order does not match the declaration order [-Wreorder-ctor] 667 :667 | 15 : ti d(tnote: id)field 'nthreads' will be initialized after field 'tidInBlock', n thr eads(nthre667ads | ), tid InB loc k(tthreiadIddx.(x),t grioupd(gr)oup,), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ n | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ t668h | r setepaSizde(sstep(Sizne_ t== h0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(groupIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u8, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDereads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ vFunc(Reduce_RING_SIMPLE_PreMulSum_bf16, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCC/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u64, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' L_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_u8, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf16, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u64, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), :667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here tidInBlo33ck | (t hr ea dI dx .x ),p grroiupm(gsro(upt),i d| ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~, | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_n 668t | h r setepaSidzes(s,te pS&izre_i =n= g0 -? >ncpclrShemevm.,co mm&.brufifSngiz-es>[NnCCeL_xPRtOT,O_ SIaMPrLEg]/sNC-CL>_SsTEePSn/sdizebofu(Tf) f: ,st epaSirzeg_)s {- >| r ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ e| c group(group v/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.hbu:33f:7f: ,note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here ar33g | s - > prriemsd(tOidp, Antrhrgea,ds , 0&r,in g-a>prregv,s &-ri>ngc->onenxtn, Iarngsd->esexnd,buf f,a arrggs-s>r-ec>vcbuoff,n anrgIs-n>rdedeOpxAr)g,; 0 , a| rgs ^-> c/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.honnIndex,: a63rgs->:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf16, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_AconnIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf16, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RLGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize'ING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(gr o up),667 | | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h t:i667d:(60t:i dnote: )field 'group' will be initialized after field 'stepSize', nth667r | e a d s (tnitdh(rteiadd)s,) ,n tthirdeIandsB(lnotchkr(etahdrse)a,d Itdixd.Ixn)B,l ogcrko(utph(rgeraoduIpd)x,. x )| , ^~~~~~~~~~~ group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u8, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); In file included from | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h: :/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h77::6675::15: note: warning: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested hereinitializer order does not match the declaration order [-Wreorder-ctor] 77 | runRinge(aadrsg(sn)t;h r e| a ^d s), tidInBlock(threadI/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hd:x203.:x66):, note: gin instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested herer oup(group), 203| | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ RunWorkElement <668F | n , T ,s tReepdSOipz,e (Asltgeop,S iPzreo_t o=,= C0O L?L _nUcNcRlOSLhLm>e(m)..croumnm(.wbeu)f;f S i| z ^e s[NCCL_PROTO_SIMP/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cppL:E5]:/1N:C Cnote: Lin instantiation of member function 'RunWork, 1, 1, 2>::run' requested here_ STEPS/sizeof(T) : 5s | tDeEpFSIiNzEe__n)c c{l D evFunc(Reduce_RING_LL128_MinMax_u8, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u8, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u8, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf16, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u8, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf16, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u8, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h(long n) { | ^~~~~ :667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u8, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf16, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf16, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf16, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u8, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf16, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf16, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf16, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1200. [ 80%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_bf8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_bf8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_bf8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_bf8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx90a. [ 80%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1102. [ 81%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx90a. [ 81%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_bf8, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf8, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf8, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf8, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf8, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf8, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(groIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf8, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' up), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf8, ncclFuncReduce, FuncPreMulSum, rccl_bflo 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ at8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_bf8, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf8, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf8, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf8, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf8, ncclFuncReduce, FuncPreMulSum, rccl_bfloIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ at8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf8, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf8, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf8, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf8, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf8, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 9 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ :10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 9 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 9 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f16, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_f16, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f16, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f16, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f16, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f16, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f16, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f16, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f16, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f32, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f16, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f32, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f16, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f16, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_f16, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f16, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f32, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f16, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f32, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f16, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_f32, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f32, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f32, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_f32, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f32, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f32, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f16, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f16, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f32, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f32, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f32, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f32, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f32, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f32, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f32, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f32, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ [ 81%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f64, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_f64, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f64, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f64, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f64, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f64, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f64, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f64, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f64, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f64, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f64, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f64, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_f64, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f64, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f64, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f64, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f64, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1201. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f64, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1100. [ 81%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_u32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_u32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f8, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tiIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ d/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_f8, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f8, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f8, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_f8, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSi_zSIMPLE]/NCCL_STEPS/sizeof(T) : stepSizee_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f8, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ _) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f8, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f8, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f8, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f8, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f8, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f8, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f8, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f8, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f8, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx90a. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f8, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f8, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f8, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 9 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ [ 82%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_u64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_u64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ [ 82%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_u8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_u8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_u32, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u32, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u32, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u32, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u32, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u32, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u32, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u32, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_u32, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u32, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u32, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u32, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u32, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u32, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u32, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u32, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u32, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u32, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ [ 82%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_bf16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_bf16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_bf16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_bf16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ : In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u64, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_u8, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u8, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u64, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u8, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u8, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u64, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u64, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u64, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_u8, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u64, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u8, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_u64, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u8, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_u64, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ 33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u8, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~dx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u8, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u64, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u8, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u64, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u64, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u64, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u64, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u64, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u8, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u8, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u8, ncclFuncReduce/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u64, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u64, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u8, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u64, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u8, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u8, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u64, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 9 warnings generated when compiling for host. 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u8, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u8, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf16, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf16, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf16, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf16, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf16, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf16, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1200. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf16, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf16, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf16, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1100. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_bf16, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf16, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf16, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf16, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args-In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ >recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_bf16, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf16, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf16, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf16, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf16, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 10 warnings generated when compiling for gfx90a. [ 82%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_bf8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_bf8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_bf8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_bf8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp 9 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ [ 83%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 9 warnings generated when compiling for gfx1100. 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf8, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf8, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1200. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_bf8, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf8, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf8, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_bf8, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf8, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf8, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf8, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf8, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, a10 warnings generated when compiling for gfx90a. rgs->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf8, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf8, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf8, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf8, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf8, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1101. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf8, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf8, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf8, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ [ 83%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f32.cpp.o In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ [ 83%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx90a. [ 83%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_f16, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f16, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f16, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f16, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f16, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f16, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f16, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f16, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f16, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f16, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f16, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_f16, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx90a. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f16, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f16, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f16, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f16, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f16, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f16, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f32, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f32, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f32, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f32, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_f32, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f32, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f32, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f32, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f32, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ hreadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f32, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_f32, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f32, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f32, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f32, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f32, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f32, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f32, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f32, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f64, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f64, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f64,In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h: ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f64, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f64, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f64, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f64, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f64, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f8, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_f64, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_f64, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f64, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f64, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(thIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f64, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x):667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f64, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ), groupreadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ (group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ , group(group), | ^~~~~~~~~~~ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | , RedOp, Proto, COLL_UNROLL>(args) ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f64, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f64, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tiIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f8, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ dInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f8, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f8, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f8, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f8, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f64, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreaIn file included from ds/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp(:n1t: In file included from hre/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.ha:d17s: In file included from ), /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.hti:11d: IIn file included from n/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.hBl:oc12k: (In file included from t/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.hh:re126a: dIIn file included from dx/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h.:14: xIn file included from )/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h, gr:o37u: pIn file included from (/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:g14r: o/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] up), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ 46 | s| t tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_atic long log2i (668l | o n sgt enp)S i{z e | ( ^~~~~st epSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f8, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f64, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_f8, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_f8, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f8, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f8, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f8, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f8, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f8, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f8, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f8, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f8, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f8, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx90a. [ 84%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_u32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_u32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1100. [ 84%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_u64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_u64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp 9 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1201. [ 84%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_u8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_u8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1100. [ 84%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_bf16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_bf16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_bf16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_bf16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ [ 85%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_bf8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_bf8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_bf8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_bf8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u32, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hthreadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_S:667:15I: warning: initializer order does not match the declaration order [-Wreorder-ctor] MPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->rec667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/svbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args);i zeof( T) : st| epSize ^_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims:(tid, nt203hreads:, &rin66g->pre:v, &rin g->nexnote: t, argin instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested heres->sendb uf 203 | RunWorkElefm, argse->recvnbuff, targs->connIlgo, Proto, COLL_UNROLL>()nde.x, argsr->connuIndex)n; | ^ (/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.hwe);:63:5 : | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_n cnote: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here c63 | lrunRingD(arges); ,| ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: Fnote: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here u203 | ncProd, uint32_t, N C RuCnWorkELlement<_Fn, T,A LGO_RING, NCCL_PROTO_SIMPLE) RedOp, Alg| o, Pro^to, COL L_UNRO/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hLL>().:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork:7:1: ,note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINaE_nccllDevFungc(Redo, proto, 2>().run(&nuce_RING_cSIMPLE_cProd_ul32, nShmem.work); \ | cclFunc ^Reduce , Fun/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hcPro:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' d , uint32_t, NCC667 | tid(tid), nthreL_ALGOa_RING,d NCCL_sPROTO_(SIMPLEn) threads | )^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h,:409: tidInBlock(threadIdx.x), grou52:p note: expanded from macro 'DEFINE_ncclDevFunc' (409 | g RunWorrk, algo, proto, 4>().run(&ncclShmem.work);:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u64, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u32, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u32, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u32, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u32, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u32, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u64, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_u32, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u32, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u64, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_u64, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u32, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u32, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u64, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u64, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u64, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, pIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ roto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArgIn file included from , 0/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp,: 1a: rIn file included from g/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hs:-17>: cIn file included from o/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.hn:n11I: nIn file included from d/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.he:x12,: In file included from a/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.hr:g126s: -In file included from >/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.hc:o14n: nIn file included from I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.hn:d37e: xIn file included from )/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h;: 14 : | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h ^ :46:13: warning: unused function 'log2i' [-Wunused-function] /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h: 6346: | 5s:t anote: tin instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested herei c long log 263i | ( l o n gr unn)R i{n g <| T ^~~~~, RedOp, Proto, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u64, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u64, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u64, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u32, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u64, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u64, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u32, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u64, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u32, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_u64, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ GO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ m.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u64, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_u32, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u32, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u64, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u64, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u32, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u64, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u8, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u8, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_u8, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ o, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u8, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u8, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u8, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u8, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElementl(,) .tryu,n (rweed)o;p < t| y ^> , algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667: 155: | Dnote: Efield 'nthreads' will be initialized after field 'tidInBlock'F INE_ncclDevFunc( R667e | d u c e _tRiIdN(Gt_iLdL)1,2 8n_tPhrroeda_dus8(,n tnhcrcelaFdusn)c,R etdiudcIen,B lFoucnkc(Ptrhorde,a duIidnxt.8x_)t,, gNrCoCuLp_(AgLrGoOu_pR)I,N G ,| ^~~~~~~~~~~~~~~~~N CCL_PR/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hO:T667O:_60L:L 1note: 2field 'group' will be initialized after field 'stepSize'8 ) | ^ 667 | t/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hi:d406(:t52i:d )note: ,expanded from macro 'DEFINE_ncclDevFunc' nthreads(nth r406e | a d s ) ,R utniWdoIrnkBg,r oaulpg(og,r opruopt)o,, 2| > ^~~~~~~~~~~( ).run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u8, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u8, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u8, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u8, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u8, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u8, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u8, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u8, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u8, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u8, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf16, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_bf16, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf16, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf16, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf16, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf16, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf16, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_bf16, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf16, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connInd/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf16, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | Ruex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf16, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ nWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf16, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf16, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf16, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf16, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf16, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf8, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf16, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf8, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_bf8, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf8, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf8, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ Idx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf8, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf16, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf8, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_bf8, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf8, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf8, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf8, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf8, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf8, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf8, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf8, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/size 46 | static long log2i(long n) { | ^~~~~ of(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf8, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf8, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf8, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1102. [ 85%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx90a. [ 85%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp 9 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx90a. [ 85%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx90a. [ 86%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: In file included from unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | 140 | uint 32_t udata1i, flang1, dtata2,6 flag42; _| ^~~~~ t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_f16, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f16, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthrea/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f16, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ds(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f16, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f16, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f16, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f16, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f16, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f16, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f16, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f16, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f16, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f16, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f16, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_f16, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f16, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f16, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1201. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f16, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ [ 86%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_u32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_u32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f32, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f32, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_f32, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f32, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ clShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f32, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f32, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f32, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f32, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f64, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f64, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f32, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads,In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElementprev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_f64, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ T, RedOp, Algo, Proto, COLL_UNROLL>().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f32, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f32, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f64, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_f32, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f32, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f32, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f32, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f64, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f64, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f32, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f32, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, argIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ s->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f64, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f32, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f64, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreaIn file included from ds, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f64, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x)/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ , group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f64, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f64, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ :15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f64, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_f64, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f64, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f64, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f64, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f64, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f64, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ )+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_f8, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f8, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f8, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f8, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f8, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f8, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f8, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f8, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f8, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f8, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f8, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f8, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f8, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f8, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_f8, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f8, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f8, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f8, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_u32, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u32, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u32, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u32, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx90a. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u32, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1200. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u32, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u32, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u32, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &rinIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u32, ncclg->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_u32, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ FuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u32, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u32, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u32, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u32, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u32, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u32, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u32, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u32, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1201. [ 86%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_u64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_u64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx90a. [ 86%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_u8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_u8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp 10 warnings generated when compiling for gfx90a. [ 87%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1200. [ 87%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uIn file included from int/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp3:22_: tIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.hd:a10t: aIn file included from 1/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h,: 169f: la/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.hg1:,270 :d19a:t awarning: 2,unused variable 'ptr' [-Wunused-variable] flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21 :270 | warning: unused variable 'flag1' [-Wunused-variable] 140ui | n t 64 _uti*n tp32t_rt d=a tra1ecv,P fltar(g01, )da+tlal21,2 8flaOgf2;f | s ^~~~~e t; /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h: | ^~~ 140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ int32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u64, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u64, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u64, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u64, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ [ 87%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u64, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_u64, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u64, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u64, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ reads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u64, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_u64, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf16, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u64, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u64, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u64, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_u8, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u8, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u64, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u64, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf16, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u64, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u64, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u64, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u8, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u8, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u8, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u8, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ idInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf16, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u8, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u8, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Proto, COLL_UNROLL>().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_u8, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u8, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreaIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ ds(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u8, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u8, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u8, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u8, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u8, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u8, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), gr 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf16, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ oup(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf16, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u8, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u8, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf16, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagTh/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | rread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_bf16, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf16, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ unRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_bf16, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf16, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf16, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf16, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf16, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf16, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf16, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf16, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf16, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf16, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf8, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf8, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_bf8, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf8, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf8, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf8, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf8, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf8, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf8, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf8, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf8, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf8, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), gIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ roup(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf8, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf8, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_bf8, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf8, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf8, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf8, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f16, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f16, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f16, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f16, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f16, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f16, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_f16, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f16, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f16, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_f16, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h :667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f16, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f16, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f16, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f16, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f16, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f16, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f16, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f16, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx90a. [ 88%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1200. [ 88%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp 10 warnings generated when compiling for gfx90a. [ 88%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f32, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f32, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1201. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f32, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1100. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f32, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f32, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_f32, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_f32, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f32, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f32, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f32, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f32, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f32, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f32, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f32, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f32, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f32, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f32, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f32, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 9 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 10 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f64, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f64, ncclIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ FuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, aIn file included from rgs->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f64, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: :In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: 667In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167:: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:60667::15: warning: initializer order does not match the declaration order [-Wreorder-ctor]note: field 'group' will be initialized after field 'stepSize' 667 | tid(ti667d), | nt hre ads (nt hretads)i, tdidI(nBltocki(thdrea)dId,x.x ), ngrotup(hgrorup)e, a| ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ d | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ s 668( | n sttephSizre(esteapSize_d ==s 0 )? n,ccl Shmtem.icomdm.bIuffSnizeBs[NlCCLo_PRcOTOk_SI(MPLtE]/hNrCCL_eSTaEPSd/siIzeofd(T)x : .stexpSi)ze_,) { | g ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ r| group(group o/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.hup:34(:7:g note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested herer o34u | p ) pr,ims( ti d, | nth ^~~~~~~~~~~read s, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ c(ReduceScatter_RING_SIMPLE_PreMulSum_f64, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f64, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f64, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidI:n667:15B: warning: linitializer order does not match the declaration order [-Wreorder-ctor] oc667 | k ( titd(htird),e nthreaadsd(ntIhredadsx), .tidxInB)loc,k(t hregadIdrx.xo), ugropup((grogup)r, o | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ u | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ p)668 | , st epSi| ze( ^~~~~~~~~~~~~~~~~ste pS/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hize_ == 0 :? n667ccl:Shm60em.:com m.bnote: ufffield 'group' will be initialized after field 'stepSize'Siz es[ NCCL_PROT667O_SI | MPL E]/ NCC L_S TEPtS/siizedof((T) t: sitepdSiz)e_) ,{ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~n | t group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.hhr:e34:a7: note: din instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here s 34( | n t hprirmse(tiad, dnthsrea)ds,, &r ingt->priev,d &rIingn->nBextl, aorgsc->skend(buftf,h arrgeadIdx.x), group(group), | ^~~~~~~~~~~ s->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f64, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ [ 88%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_u32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_u32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_f64, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 10 warnings generated when compiling for gfx90a. 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f64, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f64, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f64, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f64, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ [ 89%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_u64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_u64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f64, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f64, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_f64, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f64, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f64, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f64, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f8, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f8, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f8, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f8, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_f8, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_f8, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f8, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f8, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f8, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f8, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f8, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f8, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f8, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f8, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tidf8, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ (tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f8, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f8, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f8, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_u32, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u32, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u32, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u32, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u32, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u32, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1201. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u32, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u32, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u64, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u32, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex);/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp | : ^ 1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h: :In file included from 65:/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h5::11 : note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h: 126: 65 | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h : 14 : rIn file included from u/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.hn:R37i: nIn file included from g(args); | ^ 46 | static lo/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hn:g203 :l66o:g 2note: iin instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here( long n) { | ^~~~~203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u32, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u32, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u32, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u64, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u32, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_u32, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u32, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u32, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ NROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u64, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u64, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u64, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u32, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u64, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_u64, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u64, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from 9 warnings generated when compiling for gfx1102. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u64, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto,In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u64, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_u64, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u64, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u32, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group)/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u64, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u64, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u64, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 10 warnings generated when compiling for gfx90a. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u64, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u64, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u64, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx90a. [ 89%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_u8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_u8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx90a. [ 89%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_bf16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_bf16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_bf16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_bf16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1102. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_u8, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u8, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u8, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u8, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff,In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u8, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(lo/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_u8, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u8, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u8, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u8, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u8, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u8, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, a/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ rgs->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u8, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u8, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u8, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u8, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 9 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u8, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u8, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u8, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf16, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx./builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf16, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf16, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf16, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf16, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_bf16, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf16, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_bf16, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf16, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf16, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf16, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf16, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf16, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ [ 90%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f16.cpp.o [ 89%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_bf8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_bf8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_bf8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_bf8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf16, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ :667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf16, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf16, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf16, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf16, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ [ 90%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf8, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_f16, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f16, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf8, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf8, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f16, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f16, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_bf8, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf8, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf8, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(groupIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf8, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_f16, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring-/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f16, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f16, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ >prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f16, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f16, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf8, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(ntIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->rehreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_bf8, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ dOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f16, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf8, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f16, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f16, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf8, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf8, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf8, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf8, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f16, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf8, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f16, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f16, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf8, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f16, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f16, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | :667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | step tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Size(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf8, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f16, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf8, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 9 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f32, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_f32, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f32, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx90a. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f32, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f32, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f32, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f32, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f32, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f32, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f32, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f32, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx90a. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f32, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f32, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1200. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_f32, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f32, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f32, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ [ 90%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f32, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f32, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx90a. [ 90%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx90a. [ 91%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_u32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_u32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f64, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1100. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f64, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f64, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_f64, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f64, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f64, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f64, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthre 46 | static long log2i(long n) { | ^~~~~ ads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f64, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f64, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_f64, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint3In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, da2_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | ta2, flag2; | ^~~~~ uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ :667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f64, ncclFuncReduceSca/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ tter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f64, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f64, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f64, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f64, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f64, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f64, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f64, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1200. 9In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f8, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f8, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f8, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f8, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_f8, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f8, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f8, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f8, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f8, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f8, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1102. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f8, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_f8, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f8, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f8, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f8, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, aIn file included from lgo/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp,: p2r: oIn file included from t/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.ho:,10 : 4In file included from >/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h(:)167.: ru/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hn(:&667n:c15c:l Swarning: hinitializer order does not match the declaration order [-Wreorder-ctor]m em.work); \ | ^ 667 | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h :t667i:d15(:t inote: dfield 'nthreads' will be initialized after field 'tidInBlock') , nthreads(nt h667r | e a d s )t,i dt(itdiIdn)B,l oncthreads(ntkh(rtehardesa)d,I dtxi.dxI)n,B lgorcoku(pt(hgrreoaudpI)d,x . x| ) ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~, g| r tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_o up(group), | ^~~~~~~~~~~~~~~~~ 668 | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hs:t667e:p60S:i znote: efield 'group' will be initialized after field 'stepSize'( stepSize_ =667= | 0 ? tnicdc(ltSihdm)e,m .nctohmrme.abdusf(fnStihzreesa[dNsC)C,L _tPiRdOITnOB_lSoIcMkP(LtEh]r/eNaCdCILd_xS.TxE)P,S /gsriozuepo(fg(rTo)u p:) ,s t e| p ^~~~~~~~~~~S ize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f8, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f8, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ [ 91%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_u64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_u64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f8, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ [ 91%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_u8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_u8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_u32, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u32, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u32, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u32, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_u32, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u32, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u32, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u32, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u32, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u32, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u32, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u32, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u32, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u32, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u32, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u32, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u32, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u32, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u8, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 9 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u64, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u64, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u8, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u64, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1100. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_u64, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u64, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u64, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx90a. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_u8, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u64, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u8, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1200. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u64, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u64, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_u64, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u64, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u64, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(gIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u64, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ roup), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u64, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u8, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u64, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u8, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u64, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u64, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u64, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u8, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ [ 91%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_bf16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_bf16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_bf16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_bf16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u8, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u8, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u8, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ [ 92%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_bf8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_bf8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_bf8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_bf8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_u8, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u8, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u8, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u8, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u8, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u8, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u8, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u8, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ [ 92%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf16, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf16, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf16, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_bf16, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), grouIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf16, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ p(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf16, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf16, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf16, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf16, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf8, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1201. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_bf16, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf16, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf8, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf16, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf16, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf16, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf16, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx90a. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redO/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf16, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ pArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf16, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf8, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf8, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_bf8, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf8, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf8, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf8, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf8, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf16, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf8, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(gIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ roup), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZEIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. ), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_bf8, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf8, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf8, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tiIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf8, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ dInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf8, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf8, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf8, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf8, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx90a. [ 92%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp 9 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ [ 92%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp 9 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f16, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f16, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f16, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f16, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ [ 93%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f16, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f16, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_f16, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f16, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f16, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f16, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f16, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_f16, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f16, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f16, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f16, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f16, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f16, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f16, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_f32, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f32, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f32, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f32, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_f32, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f32, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | InBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f32, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f32, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f32, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f32, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f32, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f32, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f32, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f32, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f32, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f32, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f32, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f32, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 99 warnings generated when compiling for gfx1102. warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f64, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1100. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f64, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f64, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f64, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f64, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_f64, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sumflag1, data2,_f64, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeofIn file included from (T) : /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cppst:e2pS: izIn file included from e/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h_): 10{: In file included from | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h : | 168 group(group: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h :34140: | 7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here uint32_t data1, fl 34a | g 1 , pdriamst(at2id,, nfthlraeadgs,2 ;& ri n| g- ^~~~~> prev, &/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.hri:ng140-:>n21ex:t , warning: aunused variable 'flag1' [-Wunused-variable]r gs->send bu140ff | , a rg s ->uriecnvbtu3ff2,_ targ s-d>raetdaOp1A,rg , f0l, aarggs1-,> condnIandtexa, 2ar,g s-f>clonanIgn2de;x ); | | ^~~~~ ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.hunused variable 'data2' [-Wunused-variable]: 65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 140 | ui n65t | 3 2 _ tru ndRaintga<1T,, R efdlOap,g 1P,ro tdo,a CtOaL2L,_U NfRlOLaLg>2(;a rg s| ) ^~~~~; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h :140203 | : 66 : note: uin instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested herei nt32_t data 1203 | , f l a g 1 ,R udnWaotrkaEl2e,m enftl().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f64, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f64, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f64, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f64, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_f64, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f64, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f64, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f64, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.commIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ .buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f64, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h :667:15: warning: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hinitializer order does not match the declaration order [-Wreorder-ctor] :667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | t i667d | ( ti d ) ,t nithd(rteiadds)(,n thntrheraedasds)(,n tthiredIadnsBl)o,c k(ttihrdeIandBIldxo.xc)k,(t hgrreoaudpI(dgxr.oxu)p,) ,g r ou| p ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~( g r| o tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ up), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h668: | 667 : 60 : snote: tefield 'group' will be initialized after field 'stepSize'p Size(stepSiz e_667 = | = 0 ? nctcildS(htmiedm).,c onmmt.bhufrfeSiazedss[(NnCCtL_hPrReOaTOd_sS)I,MP LtE]i/dNICCnLB_SlTEoPcSk/(sizteohfr(Te)a :d IsdtexpS.ixz)e_,) g{r o| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~u p | ( group(groupg roup), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f64, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_f8, ncclFuncReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ y>, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f8, ncclFuncReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f64, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlocIn file included from k/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ (threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f8, ncclFuncReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f8, ncclFuncReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f8, ncclFuncReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f8, ncclFuncReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ l, ty, redop, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f8, ncclFuncReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f8, ncclFuncReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ [ 93%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_u32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_u32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f8, ncclFuncReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hst:e667p:S15i:z warning: einitializer order does not match the declaration order [-Wreorder-ctor]_ == 0 ? ncclShmem.comm.buffSizes[N C667C | L _ P RtOiTdO(t_iSd)I, MnPtLhEr]ea/dNs(CnCtLh_reSaTdEs)P,S t/isdIinBzloeckof(T) : stepSize_() { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group threadIdx.x), group(g/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.hro:u34p:),7 : | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | 34 | s te pS i ze (pstrepiSmizse(_ t=i= d0, ? nncctlShhmerme.adcs,o m&mr.ibnug-f>fpSrizeevs,[ N&CrCLi_nPgR-O>nTexOt_S, IMaPrLgEs]-/N>sCeCnLd_SbTuEfPSf/,s iazreogfs(-T>)r e: cstvepbSuizfef_,) {a r | g ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~s - >| r group(groupe dOpArg, 0, args-/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h>:c34o:n7:n Inote: nin instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here dex, args->connIndex )34; | | ^ prims(tid,/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h n:t65hr:e5a:d snote: ,in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here & ring->pr ev65, | &r i ng ->rnuenxRti, nagrgs,e ndRbeudffO,p a,r gPs-r>roectvobuf,f ,C aOrLgLs-_>UreNdROpOALrgL,> (0a, rarggss-)>c;o n n| I ^nd ex, args->connIndex)/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h; : 203| ^: 66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: 203in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here | R65u | n W o rruknERilnegA(lagrgos,) ; P r| ^o to, COLL_UNROLL>()./builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:r203:u66n:( note: win instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested heree ); | ^ 203 | Ru/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cppnW:or7k:E1l:e mnote: ein instantiation of member function 'RunWork, 1, 2, 4>::run' requested herent ((R).erudnu(wcee)S; c | a ^ tter_RING_SI/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cppM:7P:L1E:_ note: Sin instantiation of member function 'RunWork, 1, 2, 4>::run' requested here um_f8, ncclFuncR e7d | DuEcFeINSEc_nacctlDteveFru,n cF(RuednucceSSucamt,te r_rRcINcGl__SIfMlPoLaE_tS8um,_ f8N, CncCcLlF_unAcLReGdOuc_eSRcaItNteGr,, NFuCnCcLS_uPm,R rOcTclO_f_loSaIt8M, PNCLCLE_)A L GO| _^R ING, NCCL_P/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hRO:T409O_:SI52M:PL Enote: )expanded from macro 'DEFINE_ncclDevFunc' | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h409 | :409 : 52: note: Rexpanded from macro 'DEFINE_ncclDevFunc'u nWo 409r | k < c oRulnWlor,k >,, alagol, gporo,to , p4r>(o).toru,n( &4nc>c(lS)h.run(&ncmceml.Swohrmk)e;m \. w | o ^ rk); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock'/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h :667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | ti d(667t | id ), n thtrieadd(s(tnithdr)e,a dns)t,h triedaIndBslo(ckn(tthhrreaedaIddsx.)x,) t,i gdrIonuBp(lgorcoku(p)t,h r e| a ^~~~~~~~~~~~~~~~~d Idx./builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hx:667):,60: note: gfield 'group' will be initialized after field 'stepSize'r oup(group), 667 | | ^~~~~~~~~~~~~~~~~ tid(t/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hi:d667),: n60t:h rnote: eafield 'group' will be initialized after field 'stepSize'd s(nthreads), 667t | i dI n Bl otcki(dth(rteiaddId)x,.x )n,t ghrrouepa(dgsro(unpt)h, r e| a ^~~~~~~~~~~d s), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlockIn file included from (thr/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cppea:d2I: dIn file included from x/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:.10x: /In file included from WA/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.hR:P167_S: IZ/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hE):, 667 | : ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~15 : warning: | warp(tid/WARP_SIZEinitializer order does not match the declaration order [-Wreorder-ctor] 506 | flagThread((tid%4)==3), 667g | r o u p (tgirdo(utpi)d,) , | n ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~t h r| e warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3a ds(nthreads), 507t | i d I n BsltoecpkS(itzher(enacdcIldSxh.mxe)m,. cgormomu.pb(ugfrfoSuipz)e,s [ N| C ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~C L _| P tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_R OTO_LL128]/NCCL_ S668T | E P S / ssitzeepoSfi(zuei(nstt6e4p_Sti)z)e _{ = =| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~0 ?| group(groupn cclShmem.comm.buffSizes[NCCL_PROTO_SIMPL/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.hE:]34/:N7C:C Lnote: _in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested hereS TEPS/sizeof(T) : st e34p | S i z e _ ) p{r i m| s ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~( t i| d group(group, nthreads, &ring->prev, &ring->next, args->sendbuff, /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.har:g34s:-7>:r enote: cin instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested herev buff, args->redOpArg ,34 | 0 , a r g sp-r>icmosn(ntIindd,e xn,t harregasd-s>,c o&nrniInngd-e>xp)r;e v ,| ^& ring->next,/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h :a79r:g5s:- >note: sin instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested heree ndbuff, a r79g | s - > r ercuvnbRuifnfg,< Ta,r gRse-d>Orpe,d OPprAortgo,L L01,2 8a,r gCsO-L>Lc_oUnNnRIOnLdLe>x(,a ragrsg)s;- > c| o ^n nIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.hnote: :in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here65 :5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 203 | 65 | r uRnuRniWnogrP(raortgos,) ;C O L| L ^_ UNROLL>().run(we)/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h;: 203 :| 66 ^: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp | : 5 : 1 : note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here RunWorkElementI(N)G._rLuLn1(2w8e_)S;u m _| f ^8 , ncclFuncRe/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cppd:u7c:e1S: cnote: ain instantiation of member function 'RunWork, 1, 2, 2>::run' requested heret ter, FuncSum, rccl_ f7l | oDaEtF8I,N EN_CnCcLc_lADLeGvOF_uRnIcN(GR,e dNuCcCeLS_cPaRtOtTeOr__LRLI1N2G8_)S I M| P^L E_Sum_f8, n/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hc:c406l:F52u:n cnote: expanded from macro 'DEFINE_ncclDevFunc'R educeScatter, FuncSu m406, | r c c lR_ufnlWooartk8<,c oNlClC,L _tAyL,G Or_eRdIoNpG<,t yN>C,C La_lPgRoO,T Op_rSoItMoP,L E2)> ( )| .^r un(&ncclSh/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hm:e406m:.52w:o rnote: kexpanded from macro 'DEFINE_ncclDevFunc') ; \ | ^ 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f8, ncclFuncReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f8, ncclFuncReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f8, ncclFuncReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1101. In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f8, ncclFuncReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f8, ncclFuncReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx90a. [ 93%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_u64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_u64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp 10 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h76: | 13 : In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h: 13 : /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h u:i76n:t183:2 _warning: tunused variable 'y' [-Wunused-variable] y, head, mantissa; | 76 ^ | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx90a. [ 93%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_u8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_u8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1201. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_u32, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u32, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u32, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_u32, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u32, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u32, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u32, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u32, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u32, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 9 warnings generated when compiling for gfx1100. 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u32, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u32, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.coIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u32, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ mm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u32, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u32, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u32, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1201. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u32, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1101. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u32, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u32, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, maIn file included from ntis/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpps:a1;: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:| 13: ^In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ [ 94%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp [ 94%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u64, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u64, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u64, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_u64, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u64, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u64, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u64, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u64, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_u64, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u64, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u64, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u64, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u64, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u64, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u64, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u64, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u64, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t dataIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flagIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u64, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u8, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u8, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u8, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_u8, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u8, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u8, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u8, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u8, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u8, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u8, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u8, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_u8, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u8, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u8, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u8, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u8, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ :667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u8, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u8, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 9 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 10 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i64, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i64, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i64, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i32, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i32, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: 9 warnings generated when compiling for gfx1201. note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i32, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i64, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i64, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_SumPostDiv_i64, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i64, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i32, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tiIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i64, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ d), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i64, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i32, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.xIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i64, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_SumPostDiv_i32, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i64, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i32, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i32, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i32, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i32, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_SumPostDiv_i64, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ ->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i64, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i64, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i32, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i64, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i64, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i64, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i32, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i32, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_SumPostDiv_i32, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long 9 warnings generated when compiling for host. log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i32, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i32, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i64, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i32, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i32, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx90a. [ 94%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1102. [ 94%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1101. [ 95%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1100. [ 95%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_SumPostDiv_i8, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i8, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i8, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i8, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i8, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i8, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(RedIn file included from uce/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cppS:ca2t: tIn file included from e/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.hr:_10R: IIn file included from NG/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h_:S167I: MP/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hLE:_667S:u15m:P owarning: sinitializer order does not match the declaration order [-Wreorder-ctor]t Div_i8, ncclFuncReduceScatter, Fun c667S | um P o s ttDiidv(,t iidn)t,8 _ntt,h rNeCaCdLs_(AnLtGhOr_eRaIdNsG),, NtCiCdLI_nPBRlOoTcOk_(StIhMrPeLaEd)I d x| .^x ), group(g/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hr:o406u:p52):, note: expanded from macro 'DEFINE_ncclDevFunc'| ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 406 | RunW o668r | k < c o lslt,e ptSyi,z er(esdtoeppe,_ a=l=g o0, ?p rnoctcol,S h2m>e(m)..croumnm(.&bnucfcflSSihzmeesm[.NwCoCrLk_)P;R O\T O _| S ^I MPLE]/NCCL_STE/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hP:S667/:s15i:z enote: ofield 'nthreads' will be initialized after field 'tidInBlock'f (T) : stepSi z667e | _ ) { t i| d ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~( t i| d group(group ), nthreads(nthreads), tidInBlock/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h(:34t:h7r:e anote: din instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested hereI dx.x), group(group )34, | | ^~~~~~~~~~~~~~~~~ pri/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hm:s667(:t60i:d ,note: field 'group' will be initialized after field 'stepSize'n threads, &ri n667g | - > p r etvi,d (&triidn)g,- >nntehxrte,a dasr(gnst-h>rseeanddsb)u,f ft,i daIrngBsl-o>crke(ctvhbruefafd,I daxr.gxs)-,> rgerdoOuppA(rggr,o u0p,) ,a r g| s ^~~~~~~~~~~- >connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i8, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i8, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i8, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i8, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i8, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i8, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i8, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i8, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx90a. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_SumPostDiv_i8, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i8, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ [ 95%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_bf16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_bf16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_bf16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_bf16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i8, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ [ 95%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_bf8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_bf8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_bf8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_bf8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u32, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u32, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u32, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u32, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_SumPostDiv_u32, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint3/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data2_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_SumPostDiv_u32, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u32, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u32, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u32, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u32, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u32, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u32, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u32, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u32, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u32, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u32, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->In file included from recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_SumPostDiv_u64, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().:r1: uIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hn:13(: In file included from &/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:n13: c/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:c76:18l: Swarning: unused variable 'y' [-Wunused-variable]h me76m | . w o ruiknt)32;_t y\, he ad| , ^ma ntissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u64, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u64, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u64, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u64, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u32, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u64, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_SumPostDiv_u64, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u64, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we);In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, ar | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Redugs->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u64, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tceScatter_RING_SIMPLE_SumPostDiv_u32, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tiid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ d(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u64, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u64, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u64, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u64, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u64, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u64, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u64, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u64, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u64, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_SumPostDiv_u8, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u8, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u8, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u8, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_SumPostDiv_u8, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u8, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u8, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u8, ncclFuncReduceScatteIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u8, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ r, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u8, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u8, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u8, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u8, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u8, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u8, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u8, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u8, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u8, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_tIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ * ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf16, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf16, ncclFuncReduce, FIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSizeuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ _ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf16, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_bf16, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf16, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf16, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_bf16, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf16, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf16, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_bf8, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf16, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf16, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf8, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf16, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf8, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf16, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf16, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf8, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' comm. 406b | u f f S iRzuensW[oNrCkCL,_ SaTlEgPoS,/ spirzoetoof,( T2)> (:) .srtuenp(S&inzcec_l)S h{m em. w| o ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~r k )| ; group(group \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(thre/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.had:I33d:x7.:x )note: , in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested hereg roup(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: 33note: | field 'group' will be initialized after field 'stepSize' prims(tid ,667 | n t h r etaidds(,t i&dr)i,n gn-t>hprreeavd,s (&nrtihnrge-a>dnse)x,t ,t iadrIgnsB-l>oscekn(dtbhurfefa,d Iadrxg.sx-)>,r egcrvobuupf(fg,r oaurpg)s,- > r| e ^~~~~~~~~~~d OpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf8, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf16, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | step/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf8, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Size(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf16, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_bf8, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf16, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf8, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf8, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf8, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf8, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf8, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf8, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf8, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf16, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf8, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf8, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf8, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf8, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx90a. [ 96%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp [ 96%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp 10 warnings generated when compiling for gfx90a. [ 96%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp 9 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa;In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2In file included from , fla/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: gIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from 2/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h;:140:14 : warning: unused variable 'data1' [-Wunused-variable] | 140 | ^~~~~ uin t32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] In file included from 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 19: warning: unused variable 'ptr' [-Wunused-variable] 270 | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ [ 96%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp::22: : In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10:: In file included from 10/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h: :169In file included from : /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:168:: 270/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:19:: 140warning: :unused variable 'ptr' [-Wunused-variable] 14: warning: unused variable 'data1' [-Wunused-variable] 270 | uint64_ t140* | pt r = r ecuviPtnrt(302)+_ltl 12d8aOftfas1et,; f| l ^~~ ag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1101. 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f32, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f16, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f32, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f16, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f16, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_f64, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_f32, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f64, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f32, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f32, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_f16, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ [ 97%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_u32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_u32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f64, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f16, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f16, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f16, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f32, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_f32, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_f16, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f32, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f32, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f16, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f32, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(tIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | hreadIdx.x), group(group), | ^~~~~~~~~~~ tid(tid), nOp, Proto, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f32, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ threads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f64, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f16, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f16, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f16, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f32, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f16, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f16, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f32, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f32, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f16, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f64, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f16, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_f64, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ ().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f16, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f32, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f32, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f16, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f64, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f64, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f32, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f64, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f32, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f64, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f64, ncclFuncRedIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0uce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f64, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f64, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f64, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f64, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f64, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f64, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f64, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f8, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f8, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f8, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f8, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_f8, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f8, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f8, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f8, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f8, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f8, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f8, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1200. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f8, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_f8, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u32, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f8, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f8, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f8, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RINGIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f8, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, ty>, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u32, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_u32, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u32, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u32, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u32, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1201. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f8, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u32, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u32, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u32, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u32, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u32, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u32, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u32, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u32, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 9 warnings generated when compiling for gfx1102. 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1101. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_u32, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ 10 warnings generated when compiling for gfx90a. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u32, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u32, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u32, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx90a. [ 97%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_u64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_u64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx90a. [ 97%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_u8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_u8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp [ 97%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_i32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_i32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_i32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_i32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx90a. [ 98%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_i64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_i64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_i64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_i64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 9 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128O: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ ffset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u64, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_u64, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u64, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u64, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u64, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i32, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u64, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_u64, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u64, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u64, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i32, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i32, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u64, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u64, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i64, ncclFuncReduce, FuncSu/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u64, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+lIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ l128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u64, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i64, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u64, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i32, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u64, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:7:1: note: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i32, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u64, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u8, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_u8, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ lgo, Proto, COLL_UNROLL>().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u64, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i32, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u8, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u8, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u8, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u8, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u8, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u64, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u8, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i32, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u8, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i32, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i32, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i32, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u8, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u8, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u8, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u8, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_SumPostDiv_i32, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u8, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_u8, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ [ 98%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_i8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_i8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_i8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_i8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i32, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u8, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u8, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i32, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_SumPostDiv_i32, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i32, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i32, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i32, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i64, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u8, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i32, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i64, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i64, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_SumPostDiv_i64, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i64, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_SumPostDiv_i64, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i64, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i64, nc 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i64, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ clFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i64, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i64, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, protoIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ , 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i64, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i64, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i64, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i64, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i64, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 9 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 9 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 10 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i8, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i8, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_SumPostDiv_i8, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i8, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i8, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1101. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i8, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i8, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i8, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i8, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i8, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i8, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i8, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i8, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i8, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_SumPostDiv_i8, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ 10 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i8, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx90a. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i8, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1200. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i8, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1100. [ 98%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_u32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_u32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx90a. [ 98%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_u64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_u64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp [ 99%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_u8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_u8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp 10 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx90a. [ 99%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/sendrecv_sum_i8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/sendrecv_sum_i8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/sendrecv_sum_i8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/sendrecv_sum_i8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp [ 99%] Building CXX object CMakeFiles/rccl.dir/git_version.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT CMakeFiles/rccl.dir/git_version.cpp.o -MF CMakeFiles/rccl.dir/git_version.cpp.o.d -o CMakeFiles/rccl.dir/git_version.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/git_version.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u32, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u32, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u32, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u32, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u32, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &riIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ ng->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_SumPostDiv_u32, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u32, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u32, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u32, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tiIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ d(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_SumPostDiv_u32, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u32, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u32, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u32, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u32, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u32, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u32, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_SumPostDiv_u64, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u64, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u8, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u64, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_SumPostDiv_u64, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u64, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u64, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u8, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u32, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u8, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u8, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(gro:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.coup), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u8, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ mm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u64, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u64, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ mem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u8, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u64, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u8, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u32, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66:/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u8, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u64, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u8, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u64, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_SumPostDiv_u8, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u8, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:147:62: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1, 8>, 1>::Primitives' requested here 147 | Primitives, 0, Proto, 1> prims | ^ ^~~~~~~~~~~/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h :210:9: note: in instantiation of function template specialization 'RunWork, 1, 2, 2>::runRecv>' requested here 210 | runRecv>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u8, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u64, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u64, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128, 2>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 1, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_SumPostDiv_u8, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u64, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:86:62: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1, 8>, 1>::Primitives' requested here 86 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:222:9: note: in instantiation of function template specialization 'RunWork, 1, 2, 2>::runSend>' requested here 222 | runSend>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u8, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u64, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u64, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u8, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u8, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:147:62: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1, 2>, 1>::Primitives' requested here 147 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:214:9: note: in instantiation of function template specialization 'RunWork, 1, 2, 2>::runRecv>' requested here 214 | runRecv>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u8, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:147:62: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1, 8>, 1>::Primitives' requested here 147 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:210:9: note: in instantiation of function template specialization 'RunWork, 1, 2, 2>::runRecv>' requested here 210 | runRecv>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:86:62: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1, 2>, 1>::Primitives' requested here 86 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:226:9: note: in instantiation of function template specialization 'RunWork, 1, 2, 2>::runSend>' requested here 226 | runSend>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8, ncclFuncSendRecv, FuncSum, int8_t, LE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u64, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u8, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:147:62: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1, 4>, 1>::Primitives' requested here 147 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:214:9: note: in instantiation of function template specialization 'RunWork, 1, 2, 4>::runRecv>' requested here 214 | runRecv>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:86:62: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1, 4>, 1>::Primitives' requested here 86 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:226:9: note: in instantiation of function template specialization 'RunWork, 1, 2, 4>::runSend>' requested here 226 | runSend>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:86:62: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1, 8>, 1>::Primitives' requested here 86 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:222:9: note: in instantiation of function template specialization 'RunWork, 1, 2, 2>::runSend>' requested here 222 | runSend>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:147:62: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1, 2>, 1>::Primitives' requested here 147 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:214:9: note: in instantiation of function template specialization 'RunWork, 1, 2, 2>::runRecv>' requested here 214 | runRecv>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:147:62: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1, 2>, 1>::Primitives' requested here 147 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:214:9: note: in instantiation of function template specialization 'RunWork, 1, 2, 2>::runRecv>' requested here 214 | runRecv>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u64, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:147:62: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1, 2>, 1>::Primitives' requested here 147 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:214:9: note: in instantiation of function template specialization 'RunWork, 1, 2, 2>::runRecv>' requested here 214 | runRecv>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:147:62: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1, 2>, 1>::Primitives' requested here 147 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:214:9: note: in instantiation of function template specialization 'RunWork, 1, 2, 2>::runRecv>' requested here 214 | runRecv>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:86:62: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1, 2>, 1>::Primitives' requested here 86 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:226:9: note: in instantiation of function template specialization 'RunWork, 1, 2, 2>::runSend>' requested here 226 | runSend>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:147:62: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1, 2>, 1>::Primitives' requested here 147 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:214:9: note: in instantiation of function template specialization 'RunWork, 1, 2, 2>::runRecv>' requested here 214 | runRecv>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:147:62: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1, 4>, 1>::Primitives' requested here 147 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:214:9: note: in instantiation of function template specialization 'RunWork, 1, 2, 4>::runRecv>' requested here 214 | runRecv>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:86:62: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1, 2>, 1>::Primitives' requested here 86 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:226:9: note: in instantiation of function template specialization 'RunWork, 1, 2, 2>::runSend>' requested here 226 | runSend>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:86:62: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1, 2>, 1>::Primitives' requested here 86 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:226:9: note: in instantiation of function template specialization 'RunWork, 1, 2, 2>::runSend>' requested here 226 | runSend>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:86:62: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1, 2>, 1>::Primitives' requested here 86 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:226:9: note: in instantiation of function template specialization 'RunWork, 1, 2, 2>::runSend>' requested here 226 | runSend>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:86:62: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1, 4>, 1>::Primitives' requested here 86 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:226:9: note: in instantiation of function template specialization 'RunWork, 1, 2, 4>::runSend>' requested here 226 | runSend>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:147:62: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1, 4>, 1>::Primitives' requested here 147 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:214:9: note: in instantiation of function template specialization 'RunWork, 1, 2, 4>::runRecv>' requested here 214 | runRecv>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:147:62: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1, 4>, 1>::Primitives' requested here 147 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:214:9: note: in instantiation of function template specialization 'RunWork, 1, 2, 4>::runRecv>' requested here 214 | runRecv>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:86:62: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1, 2>, 1>::Primitives' requested here 86 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:226:9: note: in instantiation of function template specialization 'RunWork, 1, 2, 2>::runSend>' requested here 226 | runSend>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:147:62: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1, 4>, 1>::Primitives' requested here 147 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:214:9: note: in instantiation of function template specialization 'RunWork, 1, 2, 4>::runRecv>' requested here 214 | runRecv>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:147:62: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1, 4>, 1>::Primitives' requested here 147 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:214:9: note: in instantiation of function template specialization 'RunWork, 1, 2, 4>::runRecv>' requested here 214 | runRecv>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1200. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:86:62: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1, 4>, 1>::Primitives' requested here 86 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:226:9: note: in instantiation of function template specialization 'RunWork, 1, 2, 4>::runSend>' requested here 226 | runSend>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:86:62: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1, 4>, 1>::Primitives' requested here 86 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:226:9: note: in instantiation of function template specialization 'RunWork, 1, 2, 4>::runSend>' requested here 226 | runSend>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:86:62: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1, 4>, 1>::Primitives' requested here 86 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:226:9: note: in instantiation of function template specialization 'RunWork, 1, 2, 4>::runSend>' requested here 226 | runSend>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:86:62: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1, 4>, 1>::Primitives' requested here 86 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:226:9: note: in instantiation of function template specialization 'RunWork, 1, 2, 4>::runSend>' requested here 226 | runSend>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1100. 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1101. 11 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1201. 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1200. 11 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1101. 11 warnings generated when compiling for gfx1200. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1100. 11 warnings generated when compiling for gfx1101. 11 warnings generated when compiling for gfx1201. 9 warnings generated when compiling for gfx1200. 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx90a. [100%] Linking CXX shared library librccl.so /usr/bin/cmake -E cmake_link_script CMakeFiles/rccl.dir/link.txt --verbose=1 /usr/bin/cmake -E time /usr/bin/hipcc -fPIC -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -parallel-jobs=1 -Xoffload-linker -mllvm=-amdgpu-kernarg-preload-count=16 -Xlinker --dependency-file=CMakeFiles/rccl.dir/link.d -Wl,-z,relro -Wl,--as-needed -Wl,-z,pack-relative-relocs -Wl,-z,now -Wl,-z,now -Wl,--build-id=sha1 -specs=/usr/lib/rpm/redhat/redhat-package-notes -shared -Wl,-soname,librccl.so.1 -o librccl.so.1.0 CMakeFiles/rccl.dir/hipify/src/bootstrap.cc.o CMakeFiles/rccl.dir/hipify/src/channel.cc.o CMakeFiles/rccl.dir/hipify/src/collectives.cc.o CMakeFiles/rccl.dir/hipify/src/debug.cc.o CMakeFiles/rccl.dir/hipify/src/enqueue.cc.o CMakeFiles/rccl.dir/hipify/src/group.cc.o CMakeFiles/rccl.dir/hipify/src/init.cc.o CMakeFiles/rccl.dir/hipify/src/init_nvtx.cc.o CMakeFiles/rccl.dir/hipify/src/net.cc.o CMakeFiles/rccl.dir/hipify/src/msccl.cc.o CMakeFiles/rccl.dir/hipify/src/proxy.cc.o CMakeFiles/rccl.dir/hipify/src/register.cc.o CMakeFiles/rccl.dir/hipify/src/transport.cc.o CMakeFiles/rccl.dir/hipify/src/device/common.cu.cpp.o CMakeFiles/rccl.dir/hipify/src/device/onerank.cu.cpp.o CMakeFiles/rccl.dir/hipify/src/graph/connect.cc.o CMakeFiles/rccl.dir/hipify/src/graph/paths.cc.o CMakeFiles/rccl.dir/hipify/src/graph/rings.cc.o CMakeFiles/rccl.dir/hipify/src/graph/rome_models.cc.o CMakeFiles/rccl.dir/hipify/src/graph/search.cc.o CMakeFiles/rccl.dir/hipify/src/graph/topo.cc.o CMakeFiles/rccl.dir/hipify/src/graph/trees.cc.o CMakeFiles/rccl.dir/hipify/src/graph/tuning.cc.o CMakeFiles/rccl.dir/hipify/src/graph/xml.cc.o CMakeFiles/rccl.dir/hipify/src/misc/alt_rsmi.cc.o CMakeFiles/rccl.dir/hipify/src/misc/archinfo.cc.o CMakeFiles/rccl.dir/hipify/src/misc/argcheck.cc.o CMakeFiles/rccl.dir/hipify/src/misc/api_trace.cc.o CMakeFiles/rccl.dir/hipify/src/misc/ibvsymbols.cc.o CMakeFiles/rccl.dir/hipify/src/misc/ibvwrap.cc.o CMakeFiles/rccl.dir/hipify/src/misc/ipcsocket.cc.o CMakeFiles/rccl.dir/hipify/src/misc/npkit.cc.o CMakeFiles/rccl.dir/hipify/src/misc/nvmlwrap_stub.cc.o CMakeFiles/rccl.dir/hipify/src/misc/param.cc.o CMakeFiles/rccl.dir/hipify/src/misc/profiler.cc.o CMakeFiles/rccl.dir/hipify/src/misc/rocm_smi_wrap.cc.o CMakeFiles/rccl.dir/hipify/src/misc/rocmwrap.cc.o CMakeFiles/rccl.dir/hipify/src/misc/roctx.cc.o CMakeFiles/rccl.dir/hipify/src/misc/shmutils.cc.o CMakeFiles/rccl.dir/hipify/src/misc/signals.cc.o CMakeFiles/rccl.dir/hipify/src/misc/socket.cc.o CMakeFiles/rccl.dir/hipify/src/misc/strongstream.cc.o CMakeFiles/rccl.dir/hipify/src/misc/tuner.cc.o CMakeFiles/rccl.dir/hipify/src/misc/utils.cc.o CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_lifecycle.cc.o CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_parser.cc.o CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_setup.cc.o CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_status.cc.o CMakeFiles/rccl.dir/hipify/src/transport/coll_net.cc.o CMakeFiles/rccl.dir/hipify/src/transport/net_tmp.cc.o CMakeFiles/rccl.dir/hipify/src/transport/net_ib.cc.o CMakeFiles/rccl.dir/hipify/src/transport/net_socket.cc.o CMakeFiles/rccl.dir/hipify/src/transport/nvls.cc.o CMakeFiles/rccl.dir/hipify/src/transport/p2p.cc.o CMakeFiles/rccl.dir/hipify/src/transport/shm.cc.o CMakeFiles/rccl.dir/hipify/gensrc/all_gather_sum_i8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_bf16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_bf8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_bf16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_bf8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_bf16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_bf8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_bf16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_bf8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/alltoall_pivot_sum_i8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/broadcast_sum_i8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/device_table.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/host_table.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_i32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_i64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_i8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_bf16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_bf8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_i32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_i64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_i8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_bf16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_bf8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_i32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_i64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_i8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_bf16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_bf8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_bf16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_bf8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_bf16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_bf8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_bf16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_bf8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_bf16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_bf8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_bf16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_bf8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f32.cpp.o CMakeFiles/rccl.dir/hipify/gclang++: warning: argument unused during compilation: '-Xarch_host -fstack-protector-strong' [-Wunused-command-line-argument] clang++: warning: argument unused during compilation: '-Xarch_host -fcf-protection' [-Wunused-command-line-argument] clang++: warning: argument unused during compilation: '-specs=/usr/lib/rpm/redhat/redhat-package-notes' [-Wunused-command-line-argument] Elapsed time (seconds): 4334.07 ensrc/reduce_scatter_sum_f64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_bf16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_bf8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_i32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_i64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_i8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/sendrecv_sum_i8.cpp.o CMakeFiles/rccl.dir/git_version.cpp.o -fgpu-rdc -ldl /usr/lib64/librocm_smi64.so.1.0 /usr/lib64/libamdhip64.so.6.3.42133 --hip-link --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1200 --offload-arch=gfx1201 -lpthread -lrt -ldl /usr/bin/cmake -E cmake_symlink_library librccl.so.1.0 librccl.so.1 librccl.so gmake[2]: Leaving directory '/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build' [100%] Built target rccl gmake[1]: Leaving directory '/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build' /usr/bin/cmake -E cmake_progress_start /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/CMakeFiles 0 + RPM_EC=0 ++ jobs -p + exit 0 Executing(%install): /bin/sh -e /var/tmp/rpm-tmp.0o5icx + umask 022 + cd /builddir/build/BUILD/rccl-6.3.0-build + '[' /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT '!=' / ']' + rm -rf /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT ++ dirname /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT + mkdir -p /builddir/build/BUILD/rccl-6.3.0-build + mkdir /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT + CFLAGS='-O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer ' + export CFLAGS + CXXFLAGS='-O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer' + export CXXFLAGS + FFLAGS='-O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -I/usr/lib64/gfortran/modules ' + export FFLAGS + FCFLAGS='-O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -I/usr/lib64/gfortran/modules ' + export FCFLAGS + VALAFLAGS=-g + export VALAFLAGS + RUSTFLAGS='-Copt-level=3 -Cdebuginfo=2 -Ccodegen-units=1 -Cstrip=none -Cforce-frame-pointers=yes -Clink-arg=-specs=/usr/lib/rpm/redhat/redhat-package-notes --cap-lints=warn' + export RUSTFLAGS + LDFLAGS='-Wl,-z,relro -Wl,--as-needed -Wl,-z,pack-relative-relocs -Wl,-z,now -Wl,-z,now -Wl,--build-id=sha1 -specs=/usr/lib/rpm/redhat/redhat-package-notes ' + export LDFLAGS + LT_SYS_LIBRARY_PATH=/usr/lib64: + export LT_SYS_LIBRARY_PATH + CC=hipcc + export CC + CXX=hipcc + export CXX + cd rccl-rocm-6.3.0 + DESTDIR=/builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT + /usr/bin/cmake --install redhat-linux-build -- Install configuration: "RelWithDebInfo" -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/lib64/librccl.so.1.0 -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/lib64/librccl.so.1 -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/lib64/librccl.so -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/include/rccl/rccl.h -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/include/rccl/nccl_net.h -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/include/rccl/amd_detail/api_trace.h -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/rccl/msccl-algorithms -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/rccl/msccl-algorithms/allreduce-allpairs-8n-ll-32tb-op.xml -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/rccl/msccl-algorithms/allreduce-allpairs-8n-ll-32tb.xml -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/rccl/msccl-algorithms/allreduce-allpairs-8n-ll-64tb-op.xml -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/rccl/msccl-algorithms/allreduce-allpairs-8n-ll-64tb.xml -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/rccl/msccl-algorithms/allreduce-allpairs-8n-simple-op.xml -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/rccl/msccl-algorithms/allreduce-allpairs-8n-simple.xml -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/rccl/msccl-algorithms/allreduce-allpairs-8n-simple_2.xml -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/rccl/msccl-algorithms/alltoall-8n-0-9kb.xml -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/rccl/msccl-algorithms/alltoall-8n-190kb-512kb.xml -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/rccl/msccl-algorithms/alltoall-8n-512kb-7mb.xml -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/rccl/msccl-algorithms/alltoall-8n-7mb-43mb.xml -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/rccl/msccl-algorithms/alltoall-8n-9kb-190kb.xml -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/rccl/msccl-unit-test-algorithms -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/rccl/msccl-unit-test-algorithms/all-reduce-ring-ll.xml -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/rccl/msccl-unit-test-algorithms/all-reduce-ring-ll128.xml -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/rccl/msccl-unit-test-algorithms/all-reduce-ring-simple.xml -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/lib64/cmake/rccl/rccl-targets.cmake -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/lib64/cmake/rccl/rccl-targets-relwithdebinfo.cmake -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/lib64/cmake/rccl/rccl-config.cmake -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/lib64/cmake/rccl/rccl-config-version.cmake -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/doc/rccl/LICENSE.txt + echo s@/builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT@@ + find /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/lib64 -name '*.so.*.[0-9]' + sed -f br.sed + find /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/lib64 -name '*.so.[0-9]' + sed -f br.sed + find /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/lib64 -name '*.so' + sed -f br.sed + find /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/lib64 -name '*.cmake' + sed -f br.sed + '[' -f /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/doc/rccl/LICENSE.txt ']' + rm /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/doc/rccl/LICENSE.txt + /usr/bin/find-debuginfo -j6 --strict-build-id -m -i --build-id-seed 6.3.0-3.fc42 --unique-debug-suffix -6.3.0-3.fc42.x86_64 --unique-debug-src-base rccl-6.3.0-3.fc42.x86_64 --run-dwz --dwz-low-mem-die-limit 10000000 --dwz-max-die-limit 110000000 -S debugsourcefiles.list /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0 find-debuginfo: starting Extracting debug info from 1 files DWARF-compressing 1 files dwz: ./usr/lib64/librccl.so.1.0-6.3.0-3.fc42.x86_64.debug: Unknown debugging section .debug_str_offsets sepdebugcrcfix: Updated 0 CRC32s, 1 CRC32s did match. Creating .debug symlinks for symlinks to ELF files Copying sources found by 'debugedit -l' to /usr/src/debug/rccl-6.3.0-3.fc42.x86_64 find-debuginfo: done + /usr/lib/rpm/check-buildroot + /usr/lib/rpm/redhat/brp-ldconfig + /usr/lib/rpm/brp-compress + /usr/lib/rpm/redhat/brp-strip-lto /usr/bin/strip + /usr/lib/rpm/brp-strip-static-archive /usr/bin/strip + /usr/lib/rpm/check-rpaths + /usr/lib/rpm/redhat/brp-mangle-shebangs + /usr/lib/rpm/brp-remove-la-files + env /usr/lib/rpm/redhat/brp-python-bytecompile '' 1 0 -j6 + /usr/lib/rpm/redhat/brp-python-hardlink + /usr/bin/add-determinism --brp -j6 /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT Scanned 38 directories and 313 files, processed 0 inodes, 0 modified (0 replaced + 0 rewritten), 0 unsupported format, 0 errors Reading /builddir/build/BUILD/rccl-6.3.0-build/SPECPARTS/rpm-debuginfo.specpart Processing files: rccl-6.3.0-3.fc42.x86_64 Executing(%license): /bin/sh -e /var/tmp/rpm-tmp.opoi9k + umask 022 + cd /builddir/build/BUILD/rccl-6.3.0-build + cd rccl-rocm-6.3.0 + LICENSEDIR=/builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/licenses/rccl + export LC_ALL=C.UTF-8 + LC_ALL=C.UTF-8 + export LICENSEDIR + /usr/bin/mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/licenses/rccl + cp -pr /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/LICENSE.txt /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/licenses/rccl + RPM_EC=0 ++ jobs -p + exit 0 Provides: librccl.so.1()(64bit) rccl = 6.3.0-3.fc42 rccl(x86-64) = 6.3.0-3.fc42 Requires(rpmlib): rpmlib(CompressedFileNames) <= 3.0.4-1 rpmlib(FileDigests) <= 4.6.0-1 rpmlib(PayloadFilesHavePrefix) <= 4.0-1 Requires: ld-linux-x86-64.so.2()(64bit) ld-linux-x86-64.so.2(GLIBC_2.3)(64bit) libamdhip64.so.6()(64bit) libamdhip64.so.6(hip_4.2)(64bit) libamdhip64.so.6(hip_4.3)(64bit) libamdhip64.so.6(hip_4.5)(64bit) libamdhip64.so.6(hip_5.0)(64bit) libamdhip64.so.6(hip_5.3)(64bit) libamdhip64.so.6(hip_6.0)(64bit) libc.so.6()(64bit) libc.so.6(GLIBC_2.10)(64bit) libc.so.6(GLIBC_2.14)(64bit) libc.so.6(GLIBC_2.16)(64bit) libc.so.6(GLIBC_2.17)(64bit) libc.so.6(GLIBC_2.2.5)(64bit) libc.so.6(GLIBC_2.3)(64bit) libc.so.6(GLIBC_2.3.2)(64bit) libc.so.6(GLIBC_2.3.4)(64bit) libc.so.6(GLIBC_2.32)(64bit) libc.so.6(GLIBC_2.33)(64bit) libc.so.6(GLIBC_2.34)(64bit) libc.so.6(GLIBC_2.38)(64bit) libc.so.6(GLIBC_2.4)(64bit) libc.so.6(GLIBC_2.6)(64bit) libc.so.6(GLIBC_2.7)(64bit) libc.so.6(GLIBC_ABI_DT_RELR)(64bit) libgcc_s.so.1()(64bit) libgcc_s.so.1(GCC_12.0.0)(64bit) libgcc_s.so.1(GCC_3.0)(64bit) libm.so.6()(64bit) libm.so.6(GLIBC_2.2.5)(64bit) librocm_smi64.so.1()(64bit) libstdc++.so.6()(64bit) libstdc++.so.6(CXXABI_1.3)(64bit) libstdc++.so.6(CXXABI_1.3.7)(64bit) libstdc++.so.6(GLIBCXX_3.4)(64bit) libstdc++.so.6(GLIBCXX_3.4.11)(64bit) libstdc++.so.6(GLIBCXX_3.4.18)(64bit) libstdc++.so.6(GLIBCXX_3.4.19)(64bit) libstdc++.so.6(GLIBCXX_3.4.21)(64bit) libstdc++.so.6(GLIBCXX_3.4.22)(64bit) libstdc++.so.6(GLIBCXX_3.4.26)(64bit) libstdc++.so.6(GLIBCXX_3.4.29)(64bit) libstdc++.so.6(GLIBCXX_3.4.30)(64bit) libstdc++.so.6(GLIBCXX_3.4.32)(64bit) libstdc++.so.6(GLIBCXX_3.4.9)(64bit) Processing files: rccl-devel-6.3.0-3.fc42.x86_64 Executing(%doc): /bin/sh -e /var/tmp/rpm-tmp.2ouJoY + umask 022 + cd /builddir/build/BUILD/rccl-6.3.0-build + cd rccl-rocm-6.3.0 + DOCDIR=/builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/doc/rccl-devel + export LC_ALL=C.UTF-8 + LC_ALL=C.UTF-8 + export DOCDIR + /usr/bin/mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/doc/rccl-devel + cp -pr /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/README.md /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/doc/rccl-devel + RPM_EC=0 ++ jobs -p + exit 0 Provides: cmake(rccl) = 2.21.5 rccl-devel = 6.3.0-3.fc42 rccl-devel(x86-64) = 6.3.0-3.fc42 Requires(rpmlib): rpmlib(CompressedFileNames) <= 3.0.4-1 rpmlib(FileDigests) <= 4.6.0-1 rpmlib(PayloadFilesHavePrefix) <= 4.0-1 Requires: cmake-filesystem(x86-64) librccl.so.1()(64bit) Processing files: rccl-data-6.3.0-3.fc42.noarch Provides: rccl-data = 6.3.0-3.fc42 Requires(rpmlib): rpmlib(CompressedFileNames) <= 3.0.4-1 rpmlib(FileDigests) <= 4.6.0-1 rpmlib(PayloadFilesHavePrefix) <= 4.0-1 Processing files: rccl-debugsource-6.3.0-3.fc42.x86_64 Provides: rccl-debugsource = 6.3.0-3.fc42 rccl-debugsource(x86-64) = 6.3.0-3.fc42 Requires(rpmlib): rpmlib(CompressedFileNames) <= 3.0.4-1 rpmlib(FileDigests) <= 4.6.0-1 rpmlib(PayloadFilesHavePrefix) <= 4.0-1 Processing files: rccl-debuginfo-6.3.0-3.fc42.x86_64 Provides: debuginfo(build-id) = 44ca611e7aedb4322853d426472e8fc7d61a093d librccl.so.1.0-6.3.0-3.fc42.x86_64.debug()(64bit) rccl-debuginfo = 6.3.0-3.fc42 rccl-debuginfo(x86-64) = 6.3.0-3.fc42 Requires(rpmlib): rpmlib(CompressedFileNames) <= 3.0.4-1 rpmlib(FileDigests) <= 4.6.0-1 rpmlib(PayloadFilesHavePrefix) <= 4.0-1 Recommends: rccl-debugsource(x86-64) = 6.3.0-3.fc42 Checking for unpackaged file(s): /usr/lib/rpm/check-files /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT Wrote: /builddir/build/RPMS/rccl-devel-6.3.0-3.fc42.x86_64.rpm Wrote: /builddir/build/RPMS/rccl-debugsource-6.3.0-3.fc42.x86_64.rpm Wrote: /builddir/build/RPMS/rccl-debuginfo-6.3.0-3.fc42.x86_64.rpm Wrote: /builddir/build/RPMS/rccl-data-6.3.0-3.fc42.noarch.rpm Wrote: /builddir/build/RPMS/rccl-6.3.0-3.fc42.x86_64.rpm Child return code was: 0